alpaka/BlockSharedMemStUniformCudaHipBuiltIn_8hpp_source.html

/* Copyright 2022 Benjamin Worpitz, Erik Zenker, René Widera, Matthias Werner, Andrea Bocci, Bernhard Manfred Gruber

 * SPDX-License-Identifier: MPL-2.0

 */


#pragma once


#include "alpaka/block/shared/st/Traits.hpp"

#include "alpaka/core/Config.hpp"

#include "alpaka/core/Interface.hpp"


#include <cstdint>

#include <type_traits>


#if defined(ALPAKA_ACC_GPU_CUDA_ENABLED) || defined(ALPAKA_ACC_GPU_HIP_ENABLED)


namespace alpaka

{

    //! The GPU CUDA/HIP block shared memory allocator.
    //!
    //! This is an empty tag type: it carries no data members and no member functions of its own.
    //! It derives from interface::Implements to mark itself as an implementation of ConceptBlockSharedSt.
    class BlockSharedMemStUniformCudaHipBuiltIn
        : public interface::Implements<ConceptBlockSharedSt, BlockSharedMemStUniformCudaHipBuiltIn>
    {
    };


#    if !defined(ALPAKA_HOST_ONLY)


#        if defined(ALPAKA_ACC_GPU_CUDA_ENABLED) && !ALPAKA_LANG_CUDA

#            error If ALPAKA_ACC_GPU_CUDA_ENABLED is set, the compiler has to support CUDA!

#        endif


#        if defined(ALPAKA_ACC_GPU_HIP_ENABLED) && !ALPAKA_LANG_HIP

#            error If ALPAKA_ACC_GPU_HIP_ENABLED is set, the compiler has to support HIP!

#        endif


    namespace trait

    {

        //! Trait specialization declaring a block shared variable for BlockSharedMemStUniformCudaHipBuiltIn.
        //!
        //! \tparam T The type of the variable viewed through the returned reference.
        //! \tparam TuniqueId Compile-time id. It is not used inside the body; it only distinguishes template
        //!         instantiations, and each instantiation has its own function-local `__shared__` buffer.
        template<typename T, std::size_t TuniqueId>
        struct DeclareSharedVar<T, TuniqueId, BlockSharedMemStUniformCudaHipBuiltIn>
        {
            //! Declares the statically sized `__shared__` storage and exposes it as a `T`.
            //!
            //! The allocator argument is only used for trait dispatch and is not read.
            //!
            //! \return A reference to the storage reinterpreted as `T`. The storage is a raw byte array, so no
            //!         constructor of `T` is run here; the caller has to write the variable before reading it.
            __device__ static auto declareVar(BlockSharedMemStUniformCudaHipBuiltIn const&) -> T&
            {
                // A byte array with the size and alignment of T is used instead of a `__shared__ T` so that the
                // declaration does not depend on T's constructors.
                // std::uint8_t is spelled with its namespace because <cstdint> only guarantees the std:: name.
                __shared__ std::uint8_t shMem alignas(alignof(T))[sizeof(T)];

                return *(reinterpret_cast<T*>(shMem));
            }
        };


        //! Trait specialization for releasing the block shared variables of BlockSharedMemStUniformCudaHipBuiltIn.
        template<>
        struct FreeSharedVars<BlockSharedMemStUniformCudaHipBuiltIn>
        {
            //! Intentionally empty; the allocator argument is not read.
            __device__ static auto freeVars(BlockSharedMemStUniformCudaHipBuiltIn const& /* blockSharedMemSt */) -> void
            {
                // No explicit release is required: CUDA/HIP block shared memory is automatically freed when all
                // threads have left the block.
            }
        };

    } // namespace trait


#    endif


} // namespace alpaka


#endif

Config.hpp

Interface.hpp

Traits.hpp

alpaka::BlockSharedMemStUniformCudaHipBuiltIn
The GPU CUDA/HIP block shared memory allocator.
Definition BlockSharedMemStUniformCudaHipBuiltIn.hpp:21

alpaka
The alpaka accelerator library.
Definition AccCpuOmp2Blocks.hpp:52

alpaka::interface::Implements
Tag used in class inheritance hierarchies that describes that a specific interface (TInterface) is implemented by the given base class type (TBase).
Definition Interface.hpp:15