1/*===---- complex - CUDA wrapper for <complex> ------------------------------=== 2 * 3 * Permission is hereby granted, free of charge, to any person obtaining a copy 4 * of this software and associated documentation files (the "Software"), to deal 5 * in the Software without restriction, including without limitation the rights 6 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 7 * copies of the Software, and to permit persons to whom the Software is 8 * furnished to do so, subject to the following conditions: 9 * 10 * The above copyright notice and this permission notice shall be included in 11 * all copies or substantial portions of the Software. 12 * 13 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 14 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 15 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE 16 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 17 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 18 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN 19 * THE SOFTWARE. 20 * 21 *===-----------------------------------------------------------------------=== 22 */ 23 24#ifndef __CLANG_CUDA_WRAPPERS_COMPLEX 25#define __CLANG_CUDA_WRAPPERS_COMPLEX 26 27// Wrapper around <complex> that forces its functions to be __host__ 28// __device__. 29 30// First, include host-only headers we think are likely to be included by 31// <complex>, so that the pragma below only applies to <complex> itself. 32#if __cplusplus >= 201103L 33#include <type_traits> 34#endif 35#include <stdexcept> 36#include <cmath> 37#include <sstream> 38 39// Next, include our <algorithm> wrapper, to ensure that device overloads of 40// std::min/max are available. 41#include <algorithm> 42 43#pragma clang force_cuda_host_device begin 44 45// When compiling for device, ask libstdc++ to use its own implements of 46// complex functions, rather than calling builtins (which resolve to library 47// functions that don't exist when compiling CUDA device code). 48// 49// This is a little dicey, because it causes libstdc++ to define a different 50// set of overloads on host and device. 51// 52// // Present only when compiling for host. 53// __host__ __device__ void complex<float> sin(const complex<float>& x) { 54// return __builtin_csinf(x); 55// } 56// 57// // Present when compiling for host and for device. 58// template <typename T> 59// void __host__ __device__ complex<T> sin(const complex<T>& x) { 60// return complex<T>(sin(x.real()) * cosh(x.imag()), 61// cos(x.real()), sinh(x.imag())); 62// } 63// 64// This is safe because when compiling for device, all function calls in 65// __host__ code to sin() will still resolve to *something*, even if they don't 66// resolve to the same function as they resolve to when compiling for host. We 67// don't care that they don't resolve to the right function because we won't 68// codegen this host code when compiling for device. 69 70#pragma push_macro("_GLIBCXX_USE_C99_COMPLEX") 71#pragma push_macro("_GLIBCXX_USE_C99_COMPLEX_TR1") 72#define _GLIBCXX_USE_C99_COMPLEX 0 73#define _GLIBCXX_USE_C99_COMPLEX_TR1 0 74 75// Work around a compatibility issue with libstdc++ 11.1.0 76// https://bugs.llvm.org/show_bug.cgi?id=50383 77#pragma push_macro("__failed_assertion") 78#if _GLIBCXX_RELEASE == 11 79#define __failed_assertion __cuda_failed_assertion 80#endif 81 82#include_next <complex> 83 84#pragma pop_macro("__failed_assertion") 85#pragma pop_macro("_GLIBCXX_USE_C99_COMPLEX_TR1") 86#pragma pop_macro("_GLIBCXX_USE_C99_COMPLEX") 87 88#pragma clang force_cuda_host_device end 89 90#endif // include guard 91