10#ifdef ALPAKA_ACC_GPU_HIP_ENABLED
12# include <hip/hip_runtime_api.h>
13# include <hip/hip_version.h>
20 static constexpr char name[] =
"Hip";
24 using DeviceAttr_t = ::hipDeviceAttribute_t;
25 using DeviceProp_t = ::hipDeviceProp_t;
26 using Error_t = ::hipError_t;
27 using Event_t = ::hipEvent_t;
28 using Extent_t = ::hipExtent;
29 using Flag_t =
unsigned int;
30 using FuncAttributes_t = ::hipFuncAttributes;
31 using HostFn_t = void (*)(
void* data);
32 using Limit_t = ::hipLimit_t;
33 using Memcpy3DParms_t = ::hipMemcpy3DParms;
34 using MemcpyKind_t = ::hipMemcpyKind;
35 using PitchedPtr_t = ::hipPitchedPtr;
36 using Pos_t = ::hipPos;
37 using Stream_t = ::hipStream_t;
40 static constexpr Error_t success = ::hipSuccess;
41 static constexpr Error_t errorNotReady = ::hipErrorNotReady;
42 static constexpr Error_t errorHostMemoryAlreadyRegistered = ::hipErrorHostMemoryAlreadyRegistered;
43 static constexpr Error_t errorHostMemoryNotRegistered = ::hipErrorHostMemoryNotRegistered;
44 static constexpr Error_t errorUnsupportedLimit = ::hipErrorUnsupportedLimit;
45 static constexpr Error_t errorUnknown = ::hipErrorUnknown;
47 static constexpr Flag_t eventDefault = hipEventDefault;
48 static constexpr Flag_t eventBlockingSync = hipEventBlockingSync;
49 static constexpr Flag_t eventDisableTiming = hipEventDisableTiming;
50 static constexpr Flag_t eventInterprocess = hipEventInterprocess;
52 static constexpr Flag_t hostMallocDefault = hipHostMallocDefault;
53 static constexpr Flag_t hostMallocMapped = hipHostMallocMapped;
54 static constexpr Flag_t hostMallocPortable = hipHostMallocPortable;
55 static constexpr Flag_t hostMallocWriteCombined = hipHostMallocWriteCombined;
56 static constexpr Flag_t hostMallocCoherent = hipHostMallocCoherent;
57 static constexpr Flag_t hostMallocNonCoherent = hipHostMallocNonCoherent;
59 static constexpr Flag_t memAttachGlobal = hipMemAttachGlobal;
60 static constexpr Flag_t memAttachHost = hipMemAttachHost;
62 static constexpr Flag_t hostRegisterDefault = hipHostRegisterDefault;
63 static constexpr Flag_t hostRegisterPortable = hipHostRegisterPortable;
64 static constexpr Flag_t hostRegisterMapped = hipHostRegisterMapped;
65 static constexpr Flag_t hostRegisterIoMemory = hipHostRegisterIoMemory;
67 static constexpr MemcpyKind_t memcpyDefault = ::hipMemcpyDefault;
68 static constexpr MemcpyKind_t memcpyDeviceToDevice = ::hipMemcpyDeviceToDevice;
69 static constexpr MemcpyKind_t memcpyDeviceToHost = ::hipMemcpyDeviceToHost;
70 static constexpr MemcpyKind_t memcpyHostToDevice = ::hipMemcpyHostToDevice;
72 static constexpr Flag_t streamDefault = hipStreamDefault;
73 static constexpr Flag_t streamNonBlocking = hipStreamNonBlocking;
75 static constexpr DeviceAttr_t deviceAttributeMaxBlockDimX = ::hipDeviceAttributeMaxBlockDimX;
76 static constexpr DeviceAttr_t deviceAttributeMaxBlockDimY = ::hipDeviceAttributeMaxBlockDimY;
77 static constexpr DeviceAttr_t deviceAttributeMaxBlockDimZ = ::hipDeviceAttributeMaxBlockDimZ;
78 static constexpr DeviceAttr_t deviceAttributeMaxGridDimX = ::hipDeviceAttributeMaxGridDimX;
79 static constexpr DeviceAttr_t deviceAttributeMaxGridDimY = ::hipDeviceAttributeMaxGridDimY;
80 static constexpr DeviceAttr_t deviceAttributeMaxGridDimZ = ::hipDeviceAttributeMaxGridDimZ;
81 static constexpr DeviceAttr_t deviceAttributeMaxSharedMemoryPerBlock
82 = ::hipDeviceAttributeMaxSharedMemoryPerBlock;
83 static constexpr DeviceAttr_t deviceAttributeMaxThreadsPerBlock = ::hipDeviceAttributeMaxThreadsPerBlock;
84 static constexpr DeviceAttr_t deviceAttributeMultiprocessorCount = ::hipDeviceAttributeMultiprocessorCount;
85 static constexpr DeviceAttr_t deviceAttributeWarpSize = ::hipDeviceAttributeWarpSize;
87# if HIP_VERSION >= 40'500'000
88 static constexpr Limit_t limitPrintfFifoSize = ::hipLimitPrintfFifoSize;
90 static constexpr Limit_t limitPrintfFifoSize
91 =
static_cast<Limit_t
>(0x01);
93 static constexpr Limit_t limitMallocHeapSize = ::hipLimitMallocHeapSize;
103 static void hostFunction(
void* data)
105 auto ptr =
reinterpret_cast<HostFnAdaptor*
>(data);
106 ptr->func_(ptr->data_);
110 static void streamCallback(Stream_t, Error_t,
void* data)
112 auto ptr =
reinterpret_cast<HostFnAdaptor*
>(data);
113 ptr->func_(ptr->data_);
119 static inline Error_t deviceGetAttribute(
int* value, DeviceAttr_t attr,
int device)
121 return ::hipDeviceGetAttribute(value, attr, device);
124 static inline Error_t deviceGetLimit(
size_t* pValue, Limit_t limit)
126# if HIP_VERSION < 40'500'000
127 if(limit == limitPrintfFifoSize)
130 return errorUnsupportedLimit;
133 return ::hipDeviceGetLimit(pValue, limit);
136 static inline Error_t deviceReset()
138 return ::hipDeviceReset();
141 static inline Error_t deviceSetLimit(Limit_t ,
size_t )
144 return errorUnsupportedLimit;
147 static inline Error_t deviceSynchronize()
149 return ::hipDeviceSynchronize();
152 static inline Error_t eventCreate(Event_t* event)
154 return ::hipEventCreate(event);
157 static inline Error_t eventCreateWithFlags(Event_t* event, Flag_t flags)
159 return ::hipEventCreateWithFlags(event, flags);
162 static inline Error_t eventDestroy(Event_t event)
164 return ::hipEventDestroy(event);
167 static inline Error_t eventQuery(Event_t event)
169 return ::hipEventQuery(event);
172 static inline Error_t eventRecord(Event_t event, Stream_t stream)
174 return ::hipEventRecord(event, stream);
177 static inline Error_t eventSynchronize(Event_t event)
179 return ::hipEventSynchronize(event);
182 static inline Error_t
free(
void* devPtr)
184 return ::hipFree(devPtr);
187 static inline Error_t freeAsync([[maybe_unused]]
void* devPtr, [[maybe_unused]] Stream_t stream)
190# if HIP_VERSION >= 50'300'000
194 return ::hipFreeAsync(devPtr, stream);
206 static inline Error_t funcGetAttributes(FuncAttributes_t* attr,
void const* func)
208 return ::hipFuncGetAttributes(attr, func);
212 static inline Error_t funcGetAttributes(FuncAttributes_t* attr, T* func)
215# pragma GCC diagnostic push
216# pragma GCC diagnostic ignored "-Wconditionally-supported"
218 return ::hipFuncGetAttributes(attr,
reinterpret_cast<void const*
>(func));
220# pragma GCC diagnostic pop
224 static inline int getCurrentDevice()
227 using TApi = alpaka::ApiHipRt;
233 static inline Error_t getDeviceCount(
int* count)
235 return ::hipGetDeviceCount(count);
238 static inline Error_t getDeviceProperties(DeviceProp_t* prop,
int device)
240 return ::hipGetDeviceProperties(prop, device);
243 static inline char const* getErrorName(Error_t error)
245 return ::hipGetErrorName(error);
248 static inline char const* getErrorString(Error_t error)
250 return ::hipGetErrorString(error);
253 static inline Error_t getLastError()
255 return ::hipGetLastError();
258 static inline Error_t getSymbolAddress(
void** devPtr,
void const* symbol)
260 return ::hipGetSymbolAddress(devPtr, symbol);
264 static inline Error_t getSymbolAddress(
void** devPtr, T
const& symbol)
266 return ::hipGetSymbolAddress(devPtr, symbol);
269 static inline Error_t hostGetDevicePointer(
void** pDevice,
void* pHost, Flag_t flags)
271 return ::hipHostGetDevicePointer(pDevice, pHost, flags);
274 static inline Error_t hostFree(
void* ptr)
276 return ::hipHostFree(ptr);
279 static inline Error_t hostMalloc(
void** ptr,
size_t size, Flag_t flags)
281 return ::hipHostMalloc(ptr, size, flags);
284 static inline Error_t hostRegister(
void* ptr,
size_t size, Flag_t flags)
286 return ::hipHostRegister(ptr, size, flags);
289 static inline Error_t hostUnregister(
void* ptr)
291 return ::hipHostUnregister(ptr);
294 static inline Error_t launchHostFunc(Stream_t stream, HostFn_t fn,
void* userData)
297# if HIP_VERSION >= 50'400'000
299 return ::hipLaunchHostFunc(stream, HostFnAdaptor::hostFunction,
new HostFnAdaptor{fn, userData});
302 return ::hipStreamAddCallback(stream, HostFnAdaptor::streamCallback,
new HostFnAdaptor{fn, userData}, 0);
306 static inline Error_t
malloc(
void** devPtr,
size_t size)
308 return ::hipMalloc(devPtr, size);
311 static inline Error_t malloc3D(PitchedPtr_t* pitchedDevPtr, Extent_t extent)
313 return ::hipMalloc3D(pitchedDevPtr, extent);
316 static inline Error_t mallocAsync(
317 [[maybe_unused]]
void** devPtr,
318 [[maybe_unused]]
size_t size,
319 [[maybe_unused]] Stream_t stream)
322# if HIP_VERSION >= 50'600'000
323 return ::hipMallocAsync(devPtr, size, stream);
324# elif HIP_VERSION >= 50'300'000
328 return ::hipMallocAsync(devPtr, size, stream);
342 static inline Error_t mallocManaged(
void** ptr,
size_t size, Flag_t flags)
344 return ::hipMallocManaged(ptr, size, flags);
347 static inline Error_t mallocPitch(
void** devPtr,
size_t* pitch,
size_t width,
size_t height)
349 return ::hipMallocPitch(devPtr, pitch, width, height);
352 static inline Error_t memGetInfo(
size_t* free,
size_t* total)
354 return ::hipMemGetInfo(free, total);
357 static inline Error_t
memcpy(
void* dst,
void const* src,
size_t count, MemcpyKind_t kind)
359 return ::hipMemcpy(dst, src, count, kind);
362 static inline Error_t memcpy2DAsync(
372 return ::hipMemcpy2DAsync(dst, dpitch, src, spitch, width, height, kind, stream);
375 static inline Error_t memcpy3DAsync(Memcpy3DParms_t
const* p, Stream_t stream)
377 return ::hipMemcpy3DAsync(p, stream);
380 static inline Error_t memcpyAsync(
void* dst,
void const* src,
size_t count, MemcpyKind_t kind, Stream_t stream)
382 return ::hipMemcpyAsync(dst, src, count, kind, stream);
385 static inline Error_t memset2DAsync(
393 return ::hipMemset2DAsync(devPtr, pitch, value, width, height, stream);
396 static inline Error_t memset3DAsync(PitchedPtr_t pitchedDevPtr,
int value, Extent_t extent, Stream_t stream)
398 return ::hipMemset3DAsync(pitchedDevPtr, value, extent, stream);
401 static inline Error_t memsetAsync(
void* devPtr,
int value,
size_t count, Stream_t stream)
403 return ::hipMemsetAsync(devPtr, value, count, stream);
406 static inline Error_t setDevice(
int device)
408 return ::hipSetDevice(device);
411 static inline Error_t streamCreate(Stream_t* pStream)
413 return ::hipStreamCreate(pStream);
416 static inline Error_t streamCreateWithFlags(Stream_t* pStream, Flag_t flags)
418 return ::hipStreamCreateWithFlags(pStream, flags);
421 static inline Error_t streamDestroy(Stream_t stream)
423 return ::hipStreamDestroy(stream);
426 static inline Error_t streamQuery(Stream_t stream)
428 return ::hipStreamQuery(stream);
431 static inline Error_t streamSynchronize(Stream_t stream)
433 return ::hipStreamSynchronize(stream);
436 static inline Error_t streamWaitEvent(Stream_t stream, Event_t event, Flag_t flags)
438 return ::hipStreamWaitEvent(stream, event, flags);
441 static inline PitchedPtr_t makePitchedPtr(
void* d,
size_t p,
size_t xsz,
size_t ysz)
443 return ::make_hipPitchedPtr(d, p, xsz, ysz);
446 static inline Pos_t makePos(
size_t x,
size_t y,
size_t z)
448 return ::make_hipPos(x, y, z);
451 static inline Extent_t makeExtent(
size_t w,
size_t h,
size_t d)
453 return ::make_hipExtent(w, h, d);
#define ALPAKA_VERSION_NUMBER(major, minor, patch)
The alpaka accelerator library.
ALPAKA_FN_HOST auto free(TAlloc const &alloc, T const *const ptr) -> void
Frees the memory identified by the given pointer.
ALPAKA_FN_HOST auto memcpy(TQueue &queue, alpaka::detail::DevGlobalImplGeneric< TTag, TTypeDst > &viewDst, TViewSrc const &viewSrc) -> void
ALPAKA_FN_HOST auto malloc(TAlloc const &alloc, std::size_t const &sizeElems) -> T *