alpaka
Abstraction Library for Parallel Kernel Acceleration
MemFenceUniformCudaHipBuiltIn.hpp
/* Copyright 2022 Jan Stephan, Andrea Bocci, Bernhard Manfred Gruber, Tapish Narwal
 * SPDX-License-Identifier: MPL-2.0
 */

#pragma once

#include "alpaka/core/PP.hpp"

#if defined(ALPAKA_ACC_GPU_CUDA_ENABLED) || defined(ALPAKA_ACC_GPU_HIP_ENABLED)

namespace alpaka
{
    //! The GPU CUDA/HIP memory fence.
    class MemFenceUniformCudaHipBuiltIn : public interface::Implements<ConceptMemFence, MemFenceUniformCudaHipBuiltIn>
    {
    };

#    if !defined(ALPAKA_HOST_ONLY)
#        if defined(ALPAKA_ACC_GPU_CUDA_ENABLED) && !ALPAKA_LANG_CUDA
#            error If ALPAKA_ACC_GPU_CUDA_ENABLED is set, the compiler has to support CUDA!
#        endif

#        if defined(ALPAKA_ACC_GPU_HIP_ENABLED) && !ALPAKA_LANG_HIP
#            error If ALPAKA_ACC_GPU_HIP_ENABLED is set, the compiler has to support HIP!
#        endif

    namespace detail
    {
        // For CUDA > 12.8 the compiler built-in __nv_atomic_thread_fence is available for compute
        // capability versions > 7. NVCC defines __CUDACC_DEVICE_ATOMIC_BUILTINS__ when built-in atomic
        // functions are supported by the compute capability. It is unclear how this will behave with
        // clang-cuda; currently the inline PTX version of the code is sufficient for thread fences.
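        // PTX fence scope qualifiers: ".gpu" orders memory accesses for all threads on the current device,
        // while ".cta" only orders accesses for threads within the same thread block (CTA).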
        template<alpaka::MemoryOrder TMemOrder>
        [[maybe_unused]] static constexpr __device__ void cuda_ptx_fence_device([[maybe_unused]] TMemOrder order)
        {
#        if ALPAKA_ARCH_PTX >= ALPAKA_VERSION_NUMBER(9, 0, 0)
            // full acquire/release semantics support
            if constexpr(std::is_same_v<TMemOrder, mem_order::Relaxed>)
            { // Relaxed ordering requires no fence
            }
            else if constexpr(std::is_same_v<TMemOrder, mem_order::Acquire>)
            {
                asm volatile("fence.acquire.gpu;" ::);
            }
            else if constexpr(std::is_same_v<TMemOrder, mem_order::Release>)
            {
                asm volatile("fence.release.gpu;" ::);
            }
            else if constexpr(std::is_same_v<TMemOrder, mem_order::AcqRel>)
            {
                asm volatile("fence.acq_rel.gpu;" ::);
            }
            else
            { // Sequential consistency
                asm volatile("fence.sc.gpu;" ::);
            }
#        elif ALPAKA_ARCH_PTX >= ALPAKA_VERSION_NUMBER(7, 0, 0)
            // only acq_rel and sc available
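            // Acquire and Release are conservatively strengthened to acq_rel, which implies both.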
            if constexpr(std::is_same_v<TMemOrder, mem_order::Relaxed>)
            { // Relaxed ordering requires no fence
            }
            else if constexpr(std::is_same_v<TMemOrder, mem_order::Acquire>)
            {
                asm volatile("fence.acq_rel.gpu;" ::);
            }
            else if constexpr(std::is_same_v<TMemOrder, mem_order::Release>)
            {
                asm volatile("fence.acq_rel.gpu;" ::);
            }
            else if constexpr(std::is_same_v<TMemOrder, mem_order::AcqRel>)
            {
                asm volatile("fence.acq_rel.gpu;" ::);
            }
            else
            { // Sequential consistency
                asm volatile("fence.sc.gpu;" ::);
            }
#        endif
        }

        template<alpaka::MemoryOrder TMemOrder>
        [[maybe_unused]] static constexpr __device__ void cuda_ptx_fence_block([[maybe_unused]] TMemOrder order)
        {
#        if ALPAKA_ARCH_PTX >= ALPAKA_VERSION_NUMBER(9, 0, 0)
            // full acquire/release semantics support
            if constexpr(std::is_same_v<TMemOrder, mem_order::Relaxed>)
            { // Relaxed ordering requires no fence
            }
            else if constexpr(std::is_same_v<TMemOrder, mem_order::Acquire>)
            {
                asm volatile("fence.acquire.cta;" ::);
            }
            else if constexpr(std::is_same_v<TMemOrder, mem_order::Release>)
            {
                asm volatile("fence.release.cta;" ::);
            }
            else if constexpr(std::is_same_v<TMemOrder, mem_order::AcqRel>)
            {
                asm volatile("fence.acq_rel.cta;" ::);
            }
            else
            { // Sequential consistency
                asm volatile("fence.sc.cta;" ::);
            }
#        elif ALPAKA_ARCH_PTX >= ALPAKA_VERSION_NUMBER(7, 0, 0)
            // only acq_rel and sc available
            if constexpr(std::is_same_v<TMemOrder, mem_order::Relaxed>)
            { // Relaxed ordering requires no fence
            }
            else if constexpr(std::is_same_v<TMemOrder, mem_order::Acquire>)
            {
                asm volatile("fence.acq_rel.cta;" ::);
            }
            else if constexpr(std::is_same_v<TMemOrder, mem_order::Release>)
            {
                asm volatile("fence.acq_rel.cta;" ::);
            }
            else if constexpr(std::is_same_v<TMemOrder, mem_order::AcqRel>)
            {
                asm volatile("fence.acq_rel.cta;" ::);
            }
            else
            { // Sequential consistency
                asm volatile("fence.sc.cta;" ::);
            }
#        endif
        }

        template<alpaka::MemoryOrder TMemOrder>
        [[maybe_unused]] static constexpr __device__ void cuda_mem_fence_block([[maybe_unused]] TMemOrder order)
        {
            if constexpr(std::is_same_v<TMemOrder, mem_order::Relaxed>)
            { // Relaxed ordering requires no fence
                return;
            }
#        ifdef ALPAKA_CUDA_ATOMIC
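            // When ALPAKA_CUDA_ATOMIC is defined, the fence is delegated to libcu++
            // (cuda::atomic_thread_fence), which takes the memory order and an explicit thread scope.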
            ::cuda::atomic_thread_fence(MemOrderCuda::get(order), ::cuda::thread_scope_block);
#        else
#            if ALPAKA_ARCH_PTX
#                if ALPAKA_ARCH_PTX >= ALPAKA_VERSION_NUMBER(7, 0, 0)
            cuda_ptx_fence_block(order);
#                else
            __threadfence_block();
#                endif
#            endif
#        endif
        }

        template<alpaka::MemoryOrder TMemOrder>
        [[maybe_unused]] static constexpr __device__ void cuda_mem_fence_device([[maybe_unused]] TMemOrder order)
        {
            if constexpr(std::is_same_v<TMemOrder, mem_order::Relaxed>)
            { // Relaxed ordering requires no fence
                return;
            }
#        ifdef ALPAKA_CUDA_ATOMIC
            ::cuda::atomic_thread_fence(MemOrderCuda::get(order), ::cuda::thread_scope_device);
#        else
#            if ALPAKA_ARCH_PTX
#                if ALPAKA_ARCH_PTX >= ALPAKA_VERSION_NUMBER(7, 0, 0)
            cuda_ptx_fence_device(order);
#                else
            __threadfence();
#                endif
#            endif
#        endif
        }
    } // namespace detail

    namespace trait
    {
        template<>
        struct MemFenceDefaultOrder<MemFenceUniformCudaHipBuiltIn>
        {
            using type = mem_order::SeqCst;
            static constexpr auto value = mem_order::seq_cst;
        };

        template<MemoryOrder TMemOrder>
        struct MemFence<MemFenceUniformCudaHipBuiltIn, TMemOrder, memory_scope::Block>
        {
            static __device__ auto mem_fence(
                MemFenceUniformCudaHipBuiltIn const&,
                TMemOrder order,
                memory_scope::Block const&)
            {
#        ifdef ALPAKA_ACC_GPU_CUDA_ENABLED
                alpaka::detail::cuda_mem_fence_block(order);
#        else
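                // __builtin_amdgcn_fence emits an LLVM atomic fence with the given memory order and
                // sync scope; "workgroup" restricts it to the current thread block.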
                __builtin_amdgcn_fence(MemOrderHip::get(order), "workgroup");
#        endif
            }
        };

        template<MemoryOrder TMemOrder, typename TMemScope>
        struct MemFence<MemFenceUniformCudaHipBuiltIn, TMemOrder, TMemScope>
        {
            static __device__ auto mem_fence(MemFenceUniformCudaHipBuiltIn const&, TMemOrder order, TMemScope const&)
            {
                // Base case for grid and device scope fences.
                // CUDA and HIP do not have a per-grid memory fence, so a device-level fence is used.
#        ifdef ALPAKA_ACC_GPU_CUDA_ENABLED
                alpaka::detail::cuda_mem_fence_device(order);
#        else
                __builtin_amdgcn_fence(MemOrderHip::get(order), "agent");
#        endif
            }
        };

    } // namespace trait
#    endif

} // namespace alpaka

#endif
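
For context, a minimal usage sketch (not part of this file): a block-scoped release/acquire pair in a kernel, written against the three-argument alpaka::mem_fence(fence, order, scope) front end that dispatches to the traits above. The tag spellings mem_order::Release{}, mem_order::Acquire{} and memory_scope::Block{} are assumptions based on the types referenced in this header, not confirmed by this listing.

#include <alpaka/alpaka.hpp>

// Sketch only: assumes mem_order::Release{} / mem_order::Acquire{} and memory_scope::Block{}
// are valid tag instances of the types referenced in this header.
struct ProducerConsumerKernel
{
    template<typename TAcc>
    ALPAKA_FN_ACC void operator()(TAcc const& acc, int* data, int volatile* flag) const
    {
        if(alpaka::getIdx<alpaka::Block, alpaka::Threads>(acc)[0] == 0)
        {
            *data = 42; // producer: write the payload first
            // Release: the payload write may not be reordered after the flag write below.
            alpaka::mem_fence(acc, alpaka::mem_order::Release{}, alpaka::memory_scope::Block{});
            *flag = 1;
        }
        else
        {
            while(*flag == 0) // consumer: spin until the flag becomes visible
                ;
            // Acquire: the payload read below may not be reordered before the flag read.
            alpaka::mem_fence(acc, alpaka::mem_order::Acquire{}, alpaka::memory_scope::Block{});
            int const value = *data; // observes 42
            static_cast<void>(value);
        }
    }
};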