Subversion Repositories QNX 8.QNX8 LLVM/Clang compiler suite

Rev

Details | Last modification | View Log | RSS feed

Rev Author Line No. Line
14 pmbaty 1
/*===---- complex - CUDA wrapper for <complex> ------------------------------===
2
 *
3
 * Permission is hereby granted, free of charge, to any person obtaining a copy
4
 * of this software and associated documentation files (the "Software"), to deal
5
 * in the Software without restriction, including without limitation the rights
6
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
7
 * copies of the Software, and to permit persons to whom the Software is
8
 * furnished to do so, subject to the following conditions:
9
 *
10
 * The above copyright notice and this permission notice shall be included in
11
 * all copies or substantial portions of the Software.
12
 *
13
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
14
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
15
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
16
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
17
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
18
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
19
 * THE SOFTWARE.
20
 *
21
 *===-----------------------------------------------------------------------===
22
 */
23
 
24
#ifndef __CLANG_CUDA_WRAPPERS_COMPLEX
25
#define __CLANG_CUDA_WRAPPERS_COMPLEX
26
 
27
// Wrapper around <complex> that forces its functions to be __host__
28
// __device__.
29
 
30
// First, include host-only headers we think are likely to be included by
31
// <complex>, so that the pragma below only applies to <complex> itself.
32
#if __cplusplus >= 201103L
33
#include <type_traits>
34
#endif
35
#include <stdexcept>
36
#include <cmath>
37
#include <sstream>
38
 
39
// Next, include our <algorithm> wrapper, to ensure that device overloads of
40
// std::min/max are available.
41
#include <algorithm>
42
 
43
#pragma clang force_cuda_host_device begin
44
 
45
// When compiling for device, ask libstdc++ to use its own implements of
46
// complex functions, rather than calling builtins (which resolve to library
47
// functions that don't exist when compiling CUDA device code).
48
//
49
// This is a little dicey, because it causes libstdc++ to define a different
50
// set of overloads on host and device.
51
//
52
//   // Present only when compiling for host.
53
//   __host__ __device__ void complex<float> sin(const complex<float>& x) {
54
//     return __builtin_csinf(x);
55
//   }
56
//
57
//   // Present when compiling for host and for device.
58
//   template <typename T>
59
//   void __host__ __device__ complex<T> sin(const complex<T>& x) {
60
//     return complex<T>(sin(x.real()) * cosh(x.imag()),
61
//                       cos(x.real()), sinh(x.imag()));
62
//   }
63
//
64
// This is safe because when compiling for device, all function calls in
65
// __host__ code to sin() will still resolve to *something*, even if they don't
66
// resolve to the same function as they resolve to when compiling for host.  We
67
// don't care that they don't resolve to the right function because we won't
68
// codegen this host code when compiling for device.
69
 
70
#pragma push_macro("_GLIBCXX_USE_C99_COMPLEX")
71
#pragma push_macro("_GLIBCXX_USE_C99_COMPLEX_TR1")
72
#define _GLIBCXX_USE_C99_COMPLEX 0
73
#define _GLIBCXX_USE_C99_COMPLEX_TR1 0
74
 
75
// Work around a compatibility issue with libstdc++ 11.1.0
76
// https://bugs.llvm.org/show_bug.cgi?id=50383
77
#pragma push_macro("__failed_assertion")
78
#if _GLIBCXX_RELEASE == 11
79
#define __failed_assertion __cuda_failed_assertion
80
#endif
81
 
82
#include_next <complex>
83
 
84
#pragma pop_macro("__failed_assertion")
85
#pragma pop_macro("_GLIBCXX_USE_C99_COMPLEX_TR1")
86
#pragma pop_macro("_GLIBCXX_USE_C99_COMPLEX")
87
 
88
#pragma clang force_cuda_host_device end
89
 
90
#endif // include guard