alpaka/AllocCpuAligned_8hpp_source.html

/* Copyright 2022 Axel Huebl, Benjamin Worpitz, Jan Stephan, Andrea Bocci, Bernhard Manfred Gruber

 * SPDX-License-Identifier: MPL-2.0

 */


#pragma once


#include "alpaka/core/AlignedAlloc.hpp"

#include "alpaka/core/Common.hpp"

#include "alpaka/core/Interface.hpp"

#include "alpaka/dev/cpu/SysInfo.hpp"

#include "alpaka/mem/alloc/Traits.hpp"


#include <algorithm>


namespace alpaka

{

    //! The aligned CPU allocator.
    //!
    //! This class template has no members of its own; it only derives from
    //! interface::Implements<ConceptMemAlloc, ...>. The actual allocation and deallocation are provided by the
    //! trait::Malloc and trait::Free specializations for this type, which read TAlignment::value.
    //!
    //! \tparam TAlignment An integral constant containing the alignment.

    template<typename TAlignment>


    class AllocCpuAligned : public interface::Implements<ConceptMemAlloc, AllocCpuAligned<TAlignment>>

    {

    };


    namespace trait

    {

        //! Memory allocation trait specialization for the aligned CPU allocator.
        //!
        //! \tparam T The element type of the returned buffer.
        //! \tparam TAlignment An integral constant containing the requested alignment.
        template<typename T, typename TAlignment>
        struct Malloc<T, AllocCpuAligned<TAlignment>>
        {
            //! Allocates storage for \p sizeElems elements of type T through core::alignedAlloc.
            //!
            //! \param sizeElems The number of elements (not bytes) to allocate.
            //! \return The pointer handed back by core::alignedAlloc, converted to T*.
            ALPAKA_FN_HOST static auto malloc(
                AllocCpuAligned<TAlignment> const& /* alloc */,
                std::size_t const& sizeElems) -> T*
            {
#if defined(ALPAKA_ACC_GPU_CUDA_ENABLED) || defined(ALPAKA_ACC_GPU_HIP_ENABLED)
                // With CUDA/HIP enabled the host memory may later be pinned with `cudaHostRegister`, which needs
                // 4 KiB aligned memory. Older programming guides documented this requirement; it was removed from
                // later editions, but testing with PIConGPU and cuda-memcheck showed that it still applies.
                //
                // For HIP the required alignment is the size of a cache line:
                // https://rocm-developer-tools.github.io/HIP/group__Memory.html#gab8258f051e1a1f7385f794a15300e674
                //
                // The page size is 4 KiB on most x86 systems and 64 KiB on OpenPower. It can be queried on the
                // terminal with: `getconf PAGE_SIZE`
                //
                // Hence the larger of the requested alignment and the page size is used.
                std::size_t const requestedAlignment = TAlignment::value;
                std::size_t const pageSize = cpu::detail::getPageSize();
                std::size_t const alignment = std::max(requestedAlignment, pageSize);
#else
                constexpr std::size_t alignment = TAlignment::value;
#endif
                std::size_t const sizeBytes = sizeElems * sizeof(T);
                void* const rawMemory = core::alignedAlloc(alignment, sizeBytes);
                return static_cast<T*>(rawMemory);
            }
        };


        //! Memory deallocation trait specialization for the aligned CPU allocator.
        //!
        //! \tparam T The element type of the buffer being released.
        //! \tparam TAlignment An integral constant containing the requested alignment.
        template<typename T, typename TAlignment>
        struct Free<T, AllocCpuAligned<TAlignment>>
        {
            //! Releases \p ptr through core::alignedFree.
            //!
            //! \param ptr The pointer to release; its constness is cast away before it is passed on.
            ALPAKA_FN_HOST static auto free(AllocCpuAligned<TAlignment> const& /* alloc */, T const* const ptr) -> void
            {
                // The alignment is computed with the same expression the Malloc specialization uses, so that
                // core::alignedFree receives the value that was given to core::alignedAlloc.
#if defined(ALPAKA_ACC_GPU_CUDA_ENABLED) || defined(ALPAKA_ACC_GPU_HIP_ENABLED)
                std::size_t const requestedAlignment = TAlignment::value;
                std::size_t const pageSize = cpu::detail::getPageSize();
                std::size_t const alignment = std::max(requestedAlignment, pageSize);
#else
                constexpr std::size_t alignment = TAlignment::value;
#endif
                void const* const constMemory = ptr;
                core::alignedFree(alignment, const_cast<void*>(constMemory));
            }
        };

    } // namespace trait

} // namespace alpaka

AlignedAlloc.hpp

Interface.hpp

SysInfo.hpp

alpaka::AllocCpuAligned
The CPU boost aligned allocator.
Definition AllocCpuAligned.hpp:22

Common.hpp

ALPAKA_FN_HOST
#define ALPAKA_FN_HOST
Definition Common.hpp:40

Traits.hpp

alpaka::core::alignedFree
ALPAKA_FN_INLINE ALPAKA_FN_HOST void alignedFree(size_t alignment, void *ptr)
Definition AlignedAlloc.hpp:26

alpaka::core::alignedAlloc
ALPAKA_FN_INLINE ALPAKA_FN_HOST auto alignedAlloc(size_t alignment, size_t size) -> void *
Definition AlignedAlloc.hpp:14

alpaka::cpu::detail::getPageSize
size_t getPageSize()
Definition SysInfo.hpp:124

alpaka
The alpaka accelerator library.
Definition AccCpuOmp2Blocks.hpp:52

alpaka::free
ALPAKA_FN_HOST auto free(TAlloc const &alloc, T const *const ptr) -> void
Frees the memory identified by the given pointer.
Definition Traits.hpp:41

alpaka::malloc
ALPAKA_FN_HOST auto malloc(TAlloc const &alloc, std::size_t const &sizeElems) -> T *
Definition Traits.hpp:33

alpaka::interface::Implements
Tag used in class inheritance hierarchies that describes that a specific interface (TInterface) is implemented by the given class.
Definition Interface.hpp:15