/*===---- complex - CUDA wrapper for <complex> ------------------------------=== * * Permission is hereby granted, free of charge, to any person obtaining a copy * of this software and associated documentation files (the "Software"), to deal * in the Software without restriction, including without limitation the rights * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell * copies of the Software, and to permit persons to whom the Software is * furnished to do so, subject to the following conditions: * * The above copyright notice and this permission notice shall be included in * all copies or substantial portions of the Software. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN * THE SOFTWARE. * *===-----------------------------------------------------------------------=== */ #ifndef __CLANG_CUDA_WRAPPERS_COMPLEX #define __CLANG_CUDA_WRAPPERS_COMPLEX // Wrapper around <complex> that forces its functions to be __host__ // __device__. // First, include host-only headers we think are likely to be included by // <complex>, so that the pragma below only applies to <complex> itself. #if __cplusplus >= 201103L #include <type_traits> #endif #include <stdexcept> #include <cmath> #include <sstream> // Next, include our <algorithm> wrapper, to ensure that device overloads of // std::min/max are available. #include <algorithm> #pragma clang force_cuda_host_device begin // When compiling for device, ask libstdc++ to use its own implements of // complex functions, rather than calling builtins (which resolve to library // functions that don't exist when compiling CUDA device code). // // This is a little dicey, because it causes libstdc++ to define a different // set of overloads on host and device. // // // Present only when compiling for host. // __host__ __device__ void complex<float> sin(const complex<float>& x) { // return __builtin_csinf(x); // } // // // Present when compiling for host and for device. // template <typename T> // void __host__ __device__ complex<T> sin(const complex<T>& x) { // return complex<T>(sin(x.real()) * cosh(x.imag()), // cos(x.real()), sinh(x.imag())); // } // // This is safe because when compiling for device, all function calls in // __host__ code to sin() will still resolve to *something*, even if they don't // resolve to the same function as they resolve to when compiling for host. We // don't care that they don't resolve to the right function because we won't // codegen this host code when compiling for device. #pragma push_macro("_GLIBCXX_USE_C99_COMPLEX") #pragma push_macro("_GLIBCXX_USE_C99_COMPLEX_TR1") #define _GLIBCXX_USE_C99_COMPLEX 0 #define _GLIBCXX_USE_C99_COMPLEX_TR1 0 #include_next <complex> #pragma pop_macro("_GLIBCXX_USE_C99_COMPLEX_TR1") #pragma pop_macro("_GLIBCXX_USE_C99_COMPLEX") #pragma clang force_cuda_host_device end #endif // include guard