alpaka
Abstraction Library for Parallel Kernel Acceleration
Loading...
Searching...
No Matches
CudaHipCommon.hpp
Go to the documentation of this file.
1/* Copyright 2023 Axel Hübl, Benjamin Worpitz, Matthias Werner, René Widera, Andrea Bocci, Bernhard Manfred Gruber,
2 Jan Stephan
3 * SPDX-License-Identifier: MPL-2.0
4 */
5
6#pragma once
7
10#include "alpaka/idx/Traits.hpp"
14#include "alpaka/vec/Vec.hpp"
15
16#include <tuple>
17
18#if defined(ALPAKA_ACC_GPU_CUDA_ENABLED) || defined(ALPAKA_ACC_GPU_HIP_ENABLED)
19
20# ifdef ALPAKA_ACC_GPU_CUDA_ENABLED
21# include <cuda.h>
22# include <cuda_runtime.h>
23# endif
24
25# ifdef ALPAKA_ACC_GPU_HIP_ENABLED
26# if ALPAKA_COMP_HIP >= ALPAKA_VERSION_NUMBER(6, 2, 0) && ALPAKA_COMP_HIP < ALPAKA_VERSION_NUMBER(7, 0, 0)
27# define HIP_ENABLE_WARP_SYNC_BUILTINS
28# endif
29# include <hip/hip_runtime.h>
30# endif
31
32namespace alpaka
33{
34 namespace detail
35 {
37 tuple<char1, double1, float1, int1, long1, longlong1, short1, uchar1, uint1, ulong1, ulonglong1, ushort1>;
39 tuple<char2, double2, float2, int2, long2, longlong2, short2, uchar2, uint2, ulong2, ulonglong2, ushort2>;
40 using CudaHipBuiltinTypes3 = std::tuple<
41 char3,
42 dim3,
43 double3,
44 float3,
45 int3,
46 long3,
47 longlong3,
48 short3,
49 uchar3,
50 uint3,
51 ulong3,
52 ulonglong3,
53 ushort3
54// CUDA built-in variables have special types in clang native CUDA compilation
55// defined in cuda_builtin_vars.h
56# if ALPAKA_COMP_CLANG_CUDA
57 ,
58 __cuda_builtin_threadIdx_t,
59 __cuda_builtin_blockIdx_t,
60 __cuda_builtin_blockDim_t,
61 __cuda_builtin_gridDim_t
62# endif
63 >;
65 tuple<char4, double4, float4, int4, long4, longlong4, short4, uchar4, uint4, ulong4, ulonglong4, ushort4>;
66 using CudaHipBuiltinTypes = meta::
67 Concatenate<CudaHipBuiltinTypes1, CudaHipBuiltinTypes2, CudaHipBuiltinTypes3, CudaHipBuiltinTypes4>;
68
69 template<typename T>
71 } // namespace detail
72
73# ifdef ALPAKA_ACC_GPU_CUDA_ENABLED
74 namespace cuda::trait
75 {
76 template<typename T>
77 inline constexpr auto isCudaBuiltInType = alpaka::detail::isCudaHipBuiltInType<T>;
78 } // namespace cuda::trait
79# endif
80
81# ifdef ALPAKA_ACC_GPU_HIP_ENABLED
82 namespace hip::trait
83 {
84 template<typename T>
85 inline constexpr auto isHipBuiltInType = alpaka::detail::isCudaHipBuiltInType<T>;
86 } // namespace hip::trait
87# endif
88
89 namespace trait
90 {
91 //! The CUDA/HIP vectors 1D dimension get trait specialization.
92 template<typename T>
93 struct DimType<T, std::enable_if_t<meta::Contains<alpaka::detail::CudaHipBuiltinTypes1, T>::value>>
94 {
96 };
97
98 //! The CUDA/HIP vectors 2D dimension get trait specialization.
99 template<typename T>
100 struct DimType<T, std::enable_if_t<meta::Contains<alpaka::detail::CudaHipBuiltinTypes2, T>::value>>
101 {
103 };
104
105 //! The CUDA/HIP vectors 3D dimension get trait specialization.
106 template<typename T>
107 struct DimType<T, std::enable_if_t<meta::Contains<alpaka::detail::CudaHipBuiltinTypes3, T>::value>>
108 {
110 };
111
112 //! The CUDA/HIP vectors 4D dimension get trait specialization.
113 template<typename T>
114 struct DimType<T, std::enable_if_t<meta::Contains<alpaka::detail::CudaHipBuiltinTypes4, T>::value>>
115 {
117 };
118
119 //! The CUDA/HIP vectors elem type trait specialization.
120 template<typename T>
121 struct ElemType<T, std::enable_if_t<alpaka::detail::isCudaHipBuiltInType<T>>>
122 {
123 using type = decltype(std::declval<T>().x);
124 };
125
126 template<typename TCudaHipBuiltin>
127 struct GetExtents<TCudaHipBuiltin, std::enable_if_t<alpaka::detail::isCudaHipBuiltInType<TCudaHipBuiltin>>>
128 {
130 ALPAKA_FN_HOST_ACC auto operator()(TCudaHipBuiltin const& value) const
132 {
133 constexpr auto dim = Dim<TCudaHipBuiltin>::value;
134 if constexpr(dim == 1)
135 return {value.x};
136 else if constexpr(dim == 2)
137 return {value.y, value.x};
138 else if constexpr(dim == 3)
139 return {value.z, value.y, value.x};
140 else if constexpr(dim == 4)
141 return {value.w, value.z, value.y, value.x};
142 else
143 static_assert(sizeof(value) == 0, "Not implemented");
144
146 }
147 };
148
149 template<typename TCudaHipBuiltin>
150 struct GetOffsets<TCudaHipBuiltin, std::enable_if_t<alpaka::detail::isCudaHipBuiltInType<TCudaHipBuiltin>>>
151 : GetExtents<TCudaHipBuiltin>
152 {
153 };
154
155 //! The CUDA/HIP vectors idx type trait specialization.
156 template<typename TIdx>
157 struct IdxType<TIdx, std::enable_if_t<alpaka::detail::isCudaHipBuiltInType<TIdx>>>
158 {
159 using type = std::size_t;
160 };
161 } // namespace trait
162} // namespace alpaka
163
164#endif
#define ALPAKA_UNREACHABLE(...)
Before CUDA 11.5 nvcc is unable to correctly identify return statements in 'if constexpr' branches....
An n-dimensional vector.
Definition Vec.hpp:38
#define ALPAKA_FN_HOST_ACC
Definition Common.hpp:42
#define ALPAKA_NO_HOST_ACC_WARNING
Disable nvcc warning: 'calling a host function from host device function.' Usage: ALPAKA_NO_HOST_ACC_...
Definition Common.hpp:85
constexpr auto isCudaBuiltInType
std::tuple< char3, dim3, double3, float3, int3, long3, longlong3, short3, uchar3, uint3, ulong3, ulonglong3, ushort3 > CudaHipBuiltinTypes3
constexpr auto isCudaHipBuiltInType
std::tuple< char2, double2, float2, int2, long2, longlong2, short2, uchar2, uint2, ulong2, ulonglong2, ushort2 > CudaHipBuiltinTypes2
std::tuple< char1, double1, float1, int1, long1, longlong1, short1, uchar1, uint1, ulong1, ulonglong1, ushort1 > CudaHipBuiltinTypes1
meta::Concatenate< CudaHipBuiltinTypes1, CudaHipBuiltinTypes2, CudaHipBuiltinTypes3, CudaHipBuiltinTypes4 > CudaHipBuiltinTypes
std::tuple< char4, double4, float4, int4, long4, longlong4, short4, uchar4, uint4, ulong4, ulonglong4, ushort4 > CudaHipBuiltinTypes4
The alpaka accelerator library.
typename trait::IdxType< T >::type Idx
Definition Traits.hpp:29
std::integral_constant< std::size_t, N > DimInt
typename trait::DimType< T >::type Dim
The dimension type trait alias template to remove the ::type.
Definition Traits.hpp:19
STL namespace.
The dimension getter type trait.
Definition Traits.hpp:14
The element type trait.
Definition Traits.hpp:16
ALPAKA_NO_HOST_ACC_WARNING ALPAKA_FN_HOST_ACC auto operator()(TCudaHipBuiltin const &value) const -> Vec< Dim< TCudaHipBuiltin >, Idx< TCudaHipBuiltin > >
The GetExtents trait for getting the extents of an object as an alpaka::Vec.
Definition Traits.hpp:37
The GetOffsets trait for getting the offsets of an object as an alpaka::Vec.
Definition Traits.hpp:33
The idx type trait.
Definition Traits.hpp:25