Blame | Last modification | View Log | Download | RSS feed
/*===---- algorithm - CUDA wrapper for <algorithm> -------------------------===** Permission is hereby granted, free of charge, to any person obtaining a copy* of this software and associated documentation files (the "Software"), to deal* in the Software without restriction, including without limitation the rights* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell* copies of the Software, and to permit persons to whom the Software is* furnished to do so, subject to the following conditions:** The above copyright notice and this permission notice shall be included in* all copies or substantial portions of the Software.** THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN* THE SOFTWARE.**===-----------------------------------------------------------------------===*/#ifndef __CLANG_CUDA_WRAPPERS_ALGORITHM#define __CLANG_CUDA_WRAPPERS_ALGORITHM// This header defines __device__ overloads of std::min/max.//// Ideally we'd declare these functions only if we're <= C++11. In C++14,// these functions are constexpr, and so are implicitly __host__ __device__.//// However, the compiler being in C++14 mode does not imply that the standard// library supports C++14. There is no macro we can test to check that the// stdlib has constexpr std::min/max. Thus we have to unconditionally define// our device overloads.//// A host+device function cannot be overloaded, and a constexpr function// implicitly become host device if there's no explicitly host or device// overload preceding it. So the simple thing to do would be to declare our// device min/max overloads, and then #include_next <algorithm>. This way our// device overloads would come first, and so if we have a C++14 stdlib, its// min/max won't become host+device and conflict with our device overloads.//// But that also doesn't work. libstdc++ is evil and declares std::min/max in// an internal header that is included *before* <algorithm>. Thus by the time// we're inside of this file, std::min/max may already have been declared, and// thus we can't prevent them from becoming host+device if they're constexpr.//// Therefore we perpetrate the following hack: We mark our __device__ overloads// with __attribute__((enable_if(true, ""))). This causes the signature of the// function to change without changing anything else about it. (Except that// overload resolution will prefer it over the __host__ __device__ version// rather than considering them equally good).#include_next <algorithm>// We need to define these overloads in exactly the namespace our standard// library uses (including the right inline namespace), otherwise they won't be// picked up by other functions in the standard library (e.g. functions in// <complex>). Thus the ugliness below.#ifdef _LIBCPP_BEGIN_NAMESPACE_STD_LIBCPP_BEGIN_NAMESPACE_STD#elsenamespace std {#ifdef _GLIBCXX_BEGIN_NAMESPACE_VERSION_GLIBCXX_BEGIN_NAMESPACE_VERSION#endif#endif#pragma push_macro("_CPP14_CONSTEXPR")#if __cplusplus >= 201402L#define _CPP14_CONSTEXPR constexpr#else#define _CPP14_CONSTEXPR#endiftemplate <class __T, class __Cmp>__attribute__((enable_if(true, "")))inline _CPP14_CONSTEXPR __host__ __device__ const __T &max(const __T &__a, const __T &__b, __Cmp __cmp) {return __cmp(__a, __b) ? __b : __a;}template <class __T>__attribute__((enable_if(true, "")))inline _CPP14_CONSTEXPR __host__ __device__ const __T &max(const __T &__a, const __T &__b) {return __a < __b ? __b : __a;}template <class __T, class __Cmp>__attribute__((enable_if(true, "")))inline _CPP14_CONSTEXPR __host__ __device__ const __T &min(const __T &__a, const __T &__b, __Cmp __cmp) {return __cmp(__b, __a) ? __b : __a;}template <class __T>__attribute__((enable_if(true, "")))inline _CPP14_CONSTEXPR __host__ __device__ const __T &min(const __T &__a, const __T &__b) {return __a < __b ? __a : __b;}#pragma pop_macro("_CPP14_CONSTEXPR")#ifdef _LIBCPP_END_NAMESPACE_STD_LIBCPP_END_NAMESPACE_STD#else#ifdef _GLIBCXX_BEGIN_NAMESPACE_VERSION_GLIBCXX_END_NAMESPACE_VERSION#endif} // namespace std#endif#endif // __CLANG_CUDA_WRAPPERS_ALGORITHM