108533a3eSJohannes Doerfert //===--- DeviceUtils.h - OpenMP device runtime utility functions -- C++ -*-===// 208533a3eSJohannes Doerfert // 308533a3eSJohannes Doerfert // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 408533a3eSJohannes Doerfert // See https://llvm.org/LICENSE.txt for license information. 508533a3eSJohannes Doerfert // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 608533a3eSJohannes Doerfert // 708533a3eSJohannes Doerfert //===----------------------------------------------------------------------===// 808533a3eSJohannes Doerfert // 908533a3eSJohannes Doerfert // 1008533a3eSJohannes Doerfert //===----------------------------------------------------------------------===// 1108533a3eSJohannes Doerfert 1208533a3eSJohannes Doerfert #ifndef OMPTARGET_DEVICERTL_DEVICE_UTILS_H 1308533a3eSJohannes Doerfert #define OMPTARGET_DEVICERTL_DEVICE_UTILS_H 1408533a3eSJohannes Doerfert 1508533a3eSJohannes Doerfert #include "DeviceTypes.h" 1608533a3eSJohannes Doerfert #include "Shared/Utils.h" 1708533a3eSJohannes Doerfert 1808533a3eSJohannes Doerfert #pragma omp begin declare target device_type(nohost) 1908533a3eSJohannes Doerfert 2008533a3eSJohannes Doerfert namespace utils { 2108533a3eSJohannes Doerfert 22b57c0bacSJoseph Huber template <typename T> struct type_identity { 23b57c0bacSJoseph Huber using type = T; 24b57c0bacSJoseph Huber }; 25b57c0bacSJoseph Huber 26b57c0bacSJoseph Huber template <typename T, T v> struct integral_constant { 27b57c0bacSJoseph Huber inline static constexpr T value = v; 28b57c0bacSJoseph Huber }; 29b57c0bacSJoseph Huber 30b57c0bacSJoseph Huber /// Freestanding SFINAE helpers. 31b57c0bacSJoseph Huber template <class T> struct remove_cv : type_identity<T> {}; 32b57c0bacSJoseph Huber template <class T> struct remove_cv<const T> : type_identity<T> {}; 33b57c0bacSJoseph Huber template <class T> struct remove_cv<volatile T> : type_identity<T> {}; 34b57c0bacSJoseph Huber template <class T> struct remove_cv<const volatile T> : type_identity<T> {}; 35b57c0bacSJoseph Huber template <class T> using remove_cv_t = typename remove_cv<T>::type; 36b57c0bacSJoseph Huber 37b57c0bacSJoseph Huber using true_type = integral_constant<bool, true>; 38b57c0bacSJoseph Huber using false_type = integral_constant<bool, false>; 39b57c0bacSJoseph Huber 40b57c0bacSJoseph Huber template <typename T, typename U> struct is_same : false_type {}; 41b57c0bacSJoseph Huber template <typename T> struct is_same<T, T> : true_type {}; 42b57c0bacSJoseph Huber template <typename T, typename U> 43b57c0bacSJoseph Huber inline constexpr bool is_same_v = is_same<T, U>::value; 44b57c0bacSJoseph Huber 45b57c0bacSJoseph Huber template <typename T> struct is_floating_point { 46b57c0bacSJoseph Huber inline static constexpr bool value = 47*74d5373fSJoseph Huber is_same_v<remove_cv_t<T>, float> || is_same_v<remove_cv_t<T>, double>; 48b57c0bacSJoseph Huber }; 49b57c0bacSJoseph Huber template <typename T> 50b57c0bacSJoseph Huber inline constexpr bool is_floating_point_v = is_floating_point<T>::value; 51b57c0bacSJoseph Huber 52b57c0bacSJoseph Huber template <bool B, typename T = void> struct enable_if; 53b57c0bacSJoseph Huber template <typename T> struct enable_if<true, T> : type_identity<T> {}; 54b57c0bacSJoseph Huber template <bool B, typename T = void> 55b57c0bacSJoseph Huber using enable_if_t = typename enable_if<B, T>::type; 56b57c0bacSJoseph Huber 57b57c0bacSJoseph Huber template <class T> struct remove_addrspace : type_identity<T> {}; 58b57c0bacSJoseph Huber template <class T, int N> 59b57c0bacSJoseph Huber struct remove_addrspace<T [[clang::address_space(N)]]> : type_identity<T> {}; 60b57c0bacSJoseph Huber template <class T> 61b57c0bacSJoseph Huber using remove_addrspace_t = typename remove_addrspace<T>::type; 62b57c0bacSJoseph Huber 63f53cb84dSJoseph Huber template <typename To, typename From> inline To bitCast(From V) { 64f53cb84dSJoseph Huber static_assert(sizeof(To) == sizeof(From), "Bad conversion"); 65f53cb84dSJoseph Huber return __builtin_bit_cast(To, V); 66f53cb84dSJoseph Huber } 67f53cb84dSJoseph Huber 6808533a3eSJohannes Doerfert /// Return the value \p Var from thread Id \p SrcLane in the warp if the thread 6908533a3eSJohannes Doerfert /// is identified by \p Mask. 7008533a3eSJohannes Doerfert int32_t shuffle(uint64_t Mask, int32_t Var, int32_t SrcLane, int32_t Width); 7108533a3eSJohannes Doerfert 7208533a3eSJohannes Doerfert int32_t shuffleDown(uint64_t Mask, int32_t Var, uint32_t Delta, int32_t Width); 7308533a3eSJohannes Doerfert 7408533a3eSJohannes Doerfert int64_t shuffleDown(uint64_t Mask, int64_t Var, uint32_t Delta, int32_t Width); 7508533a3eSJohannes Doerfert 7608533a3eSJohannes Doerfert uint64_t ballotSync(uint64_t Mask, int32_t Pred); 7708533a3eSJohannes Doerfert 7808533a3eSJohannes Doerfert /// Return \p LowBits and \p HighBits packed into a single 64 bit value. 7908533a3eSJohannes Doerfert uint64_t pack(uint32_t LowBits, uint32_t HighBits); 8008533a3eSJohannes Doerfert 8108533a3eSJohannes Doerfert /// Unpack \p Val into \p LowBits and \p HighBits. 8208533a3eSJohannes Doerfert void unpack(uint64_t Val, uint32_t &LowBits, uint32_t &HighBits); 8308533a3eSJohannes Doerfert 8408533a3eSJohannes Doerfert /// Return true iff \p Ptr is pointing into shared (local) memory (AS(3)). 8508533a3eSJohannes Doerfert bool isSharedMemPtr(void *Ptr); 8608533a3eSJohannes Doerfert 8708533a3eSJohannes Doerfert /// Return true iff \p Ptr is pointing into (thread) local memory (AS(5)). 8808533a3eSJohannes Doerfert bool isThreadLocalMemPtr(void *Ptr); 8908533a3eSJohannes Doerfert 9008533a3eSJohannes Doerfert /// A pointer variable that has by design an `undef` value. Use with care. 9108533a3eSJohannes Doerfert [[clang::loader_uninitialized]] static void *const UndefPtr; 9208533a3eSJohannes Doerfert 9308533a3eSJohannes Doerfert #define OMP_LIKELY(EXPR) __builtin_expect((bool)(EXPR), true) 9408533a3eSJohannes Doerfert #define OMP_UNLIKELY(EXPR) __builtin_expect((bool)(EXPR), false) 9508533a3eSJohannes Doerfert 9608533a3eSJohannes Doerfert } // namespace utils 9708533a3eSJohannes Doerfert 9808533a3eSJohannes Doerfert #pragma omp end declare target 9908533a3eSJohannes Doerfert 10008533a3eSJohannes Doerfert #endif 101