WebSVN – QNX 8.QNX8 LLVM/Clang compiler suite – Blame – //llvm-build/x86_64/lib/clang/16/include/cuda_wrappers/complex

Rev	Author	Line No.	Line
14	pmbaty	1	/*===---- complex - CUDA wrapper for <complex> ------------------------------===
		2	*
		3	* Permission is hereby granted, free of charge, to any person obtaining a copy
		4	* of this software and associated documentation files (the "Software"), to deal
		5	* in the Software without restriction, including without limitation the rights
		6	* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
		7	* copies of the Software, and to permit persons to whom the Software is
		8	* furnished to do so, subject to the following conditions:
		9	*
		10	* The above copyright notice and this permission notice shall be included in
		11	* all copies or substantial portions of the Software.
		12	*
		13	* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
		14	* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
		15	* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
		16	* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
		17	* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
		18	* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
		19	* THE SOFTWARE.
		20	*
		21	*===-----------------------------------------------------------------------===
		22	*/
		23
		24	#ifndef __CLANG_CUDA_WRAPPERS_COMPLEX
		25	#define __CLANG_CUDA_WRAPPERS_COMPLEX
		26
		27	// Wrapper around <complex> that forces its functions to be __host__
		28	// __device__.
		29
		30	// First, include host-only headers we think are likely to be included by
		31	// <complex>, so that the pragma below only applies to <complex> itself.
		32	#if __cplusplus >= 201103L
		33	#include <type_traits>
		34	#endif
		35	#include <stdexcept>
		36	#include <cmath>
		37	#include <sstream>
		38
		39	// Next, include our <algorithm> wrapper, to ensure that device overloads of
		40	// std::min/max are available.
		41	#include <algorithm>
		42
		43	#pragma clang force_cuda_host_device begin
			// Everything from here to the matching `force_cuda_host_device end` below
			// is the region this wrapper forces to be __host__ __device__; it is meant
			// to contain only <complex> itself.
		44
		45	// When compiling for device, ask libstdc++ to use its own implementations of
		46	// complex functions, rather than calling builtins (which resolve to library
		47	// functions that don't exist when compiling CUDA device code).
		48	//
		49	// This is a little dicey, because it causes libstdc++ to define a different
		50	// set of overloads on host and device.
		51	//
		52	//   // Present only when compiling for host.
		53	//   __host__ __device__ complex<float> sin(const complex<float>& x) {
		54	//     return __builtin_csinf(x);
		55	//   }
		56	//
		57	//   // Present when compiling for host and for device.
		58	//   template <typename T>
		59	//   __host__ __device__ complex<T> sin(const complex<T>& x) {
		60	//     return complex<T>(sin(x.real()) * cosh(x.imag()),
		61	//                       cos(x.real()) * sinh(x.imag()));
		62	//   }
		63	//
		64	// This is safe because when compiling for device, all function calls in
		65	// __host__ code to sin() will still resolve to something, even if they don't
		66	// resolve to the same function as they resolve to when compiling for host. We
		67	// don't care that they don't resolve to the right function because we won't
		68	// codegen this host code when compiling for device.
		69
			// Save whatever definitions the two libstdc++ configuration macros currently
			// have, then force both to 0 for the duration of the <complex> include. The
			// saved definitions are restored by the pop_macro pragmas further down.
		70	#pragma push_macro("_GLIBCXX_USE_C99_COMPLEX")
		71	#pragma push_macro("_GLIBCXX_USE_C99_COMPLEX_TR1")
		72	#define _GLIBCXX_USE_C99_COMPLEX 0
		73	#define _GLIBCXX_USE_C99_COMPLEX_TR1 0
		74
		75	// Work around a compatibility issue with libstdc++ 11.1.0
		76	// https://bugs.llvm.org/show_bug.cgi?id=50383
			//
			// The macro is pushed unconditionally so that the pop below is always
			// balanced; the rename of __failed_assertion to __cuda_failed_assertion is
			// applied only when _GLIBCXX_RELEASE is 11.
		77	#pragma push_macro("__failed_assertion")
		78	#if _GLIBCXX_RELEASE == 11
		79	#define __failed_assertion __cuda_failed_assertion
		80	#endif
		81
			// Include the next <complex> found on the include search path (presumably the
			// standard library's own header) with the macro overrides above in effect.
		82	#include_next <complex>
		83
			// Restore the saved macro definitions, in the reverse order of the pushes.
		84	#pragma pop_macro("__failed_assertion")
		85	#pragma pop_macro("_GLIBCXX_USE_C99_COMPLEX_TR1")
		86	#pragma pop_macro("_GLIBCXX_USE_C99_COMPLEX")
		87
		88	#pragma clang force_cuda_host_device end
		89
		90	#endif // include guard

Subversion Repositories QNX 8.QNX8 LLVM/Clang compiler suite

QNX 8.QNX8 LLVM/Clang compiler suite//llvm-build/x86_64/lib/clang/16/include/cuda_wrappers/complex – Rev 14