alpaka/KernelExecutionFixture_8hpp_source.html

/* Copyright 2024 Benjamin Worpitz, Andrea Bocci, Bernhard Manfred Gruber, Jan Stephan, Aurora Perego

 * SPDX-License-Identifier: MPL-2.0

 */


#pragma once


#include "alpaka/alpaka.hpp"


#if defined(ALPAKA_ACC_GPU_CUDA_ENABLED) && !ALPAKA_LANG_CUDA

#    error If ALPAKA_ACC_GPU_CUDA_ENABLED is set, the compiler has to support CUDA!

#endif


#if defined(ALPAKA_ACC_GPU_HIP_ENABLED) && !ALPAKA_LANG_HIP

#    error If ALPAKA_ACC_GPU_HIP_ENABLED is set, the compiler has to support HIP!

#endif


#include "alpaka/test/Check.hpp"

#include "alpaka/test/queue/Queue.hpp"


#include <utility>


namespace alpaka::test

{

    //! The fixture for executing a kernel on a given accelerator.

    template<typename TAcc>


    class KernelExecutionFixture

    {

    public:

        using Acc = TAcc;

        using Tag = alpaka::AccToTag<Acc>;

        using Dim = alpaka::Dim<Acc>;

        using Idx = alpaka::Idx<Acc>;

        using Platform = alpaka::Platform<Acc>;

        using Device = Dev<Acc>;

        using Queue = test::DefaultQueue<Device>;

        using WorkDiv = WorkDivMembers<Dim, Idx>;


        KernelExecutionFixture(WorkDiv workDiv) : m_queue{m_device}, m_workDiv{std::move(workDiv)}

        {

        }


        template<typename TExtent>


        KernelExecutionFixture(TExtent const& extent) : m_queue{m_device}

                                                      , m_extent{extent}

        {

        }


        KernelExecutionFixture(Queue queue, WorkDiv workDiv)

            : m_platform{} // if the platform is not stateless, this is wrong; we ignore it because it is not be used

            , m_device{alpaka::getDev(queue)}

            , m_queue{std::move(queue)}

            , m_workDiv{std::move(workDiv)}

        {

        }


        template<typename TExtent>


        KernelExecutionFixture(Queue queue, TExtent const& extent)

            : m_platform{} // if the platform is not stateless, this is wrong; we ignore it because it is not be used

            , m_device{alpaka::getDev(queue)}

            , m_queue{std::move(queue)}

            , m_extent{extent}

        {

        }


        template<typename TKernelFnObj, typename... TArgs>


        auto operator()(TKernelFnObj kernelFnObj, TArgs&&... args) -> bool

        {

            // Allocate the result value

            auto bufAccResult = allocBuf<bool, Idx>(m_device, static_cast<Idx>(1u));

            memset(m_queue, bufAccResult, static_cast<std::uint8_t>(true));


            alpaka::KernelCfg<Acc> const kernelCfg = {m_extent, Vec<Dim, Idx>::ones()};


            // set workdiv if it is not before

            if(m_workDiv == WorkDiv{Vec<Dim, Idx>::all(0), Vec<Dim, Idx>::all(0), Vec<Dim, Idx>::all(0)})

                m_workDiv = alpaka::getValidWorkDiv(

                    kernelCfg,

                    m_device,

                    kernelFnObj,

                    getPtrNative(bufAccResult),

                    std::forward<TArgs>(args)...);


            exec<Tag>(m_queue, m_workDiv, kernelFnObj, getPtrNative(bufAccResult), std::forward<TArgs>(args)...);


            // Copy the result value to the host

            auto bufHostResult = allocBuf<bool, Idx>(m_devHost, static_cast<Idx>(1u));

            memcpy(m_queue, bufHostResult, bufAccResult);

            wait(m_queue);


            auto const result = *getPtrNative(bufHostResult);


            return result;

        }


    private:

        PlatformCpu m_platformHost{};

        DevCpu m_devHost{getDevByIdx(m_platformHost, 0)};

        Platform m_platform{};

        Device m_device{getDevByIdx(m_platform, 0)};

        Queue m_queue;

        WorkDiv m_workDiv{Vec<Dim, Idx>::all(0), Vec<Dim, Idx>::all(0), Vec<Dim, Idx>::all(0)};

        Vec<Dim, Idx> m_extent;

    };


} // namespace alpaka::test

Check.hpp

Queue.hpp

alpaka.hpp

alpaka::DevCpu
The CPU device handle.
Definition DevCpu.hpp:56

alpaka::Vec::ones
ALPAKA_NO_HOST_ACC_WARNING static ALPAKA_FN_HOST_ACC constexpr auto ones() -> Vec< TDim, TVal >
One value constructor.
Definition Vec.hpp:106

alpaka::Vec::all
ALPAKA_NO_HOST_ACC_WARNING static ALPAKA_FN_HOST_ACC constexpr auto all(TVal const &val) -> Vec< TDim, TVal >
Single value constructor.
Definition Vec.hpp:89

alpaka::WorkDivMembers< Dim, Idx >

alpaka::test::KernelExecutionFixture
The fixture for executing a kernel on a given accelerator.
Definition KernelExecutionFixture.hpp:27

alpaka::test::KernelExecutionFixture::WorkDiv
WorkDivMembers< Dim, Idx > WorkDiv
Definition KernelExecutionFixture.hpp:36

alpaka::test::KernelExecutionFixture::Idx
alpaka::Idx< Acc > Idx
Definition KernelExecutionFixture.hpp:32

alpaka::test::KernelExecutionFixture::Device
Dev< Acc > Device
Definition KernelExecutionFixture.hpp:34

alpaka::test::KernelExecutionFixture::KernelExecutionFixture
KernelExecutionFixture(Queue queue, WorkDiv workDiv)
Definition KernelExecutionFixture.hpp:48

alpaka::test::KernelExecutionFixture::KernelExecutionFixture
KernelExecutionFixture(WorkDiv workDiv)
Definition KernelExecutionFixture.hpp:38

alpaka::test::KernelExecutionFixture::Acc
TAcc Acc
Definition KernelExecutionFixture.hpp:29

alpaka::test::KernelExecutionFixture::Queue
test::DefaultQueue< Device > Queue
Definition KernelExecutionFixture.hpp:35

alpaka::test::KernelExecutionFixture::Platform
alpaka::Platform< Acc > Platform
Definition KernelExecutionFixture.hpp:33

alpaka::test::KernelExecutionFixture::KernelExecutionFixture
KernelExecutionFixture(Queue queue, TExtent const &extent)
Definition KernelExecutionFixture.hpp:57

alpaka::test::KernelExecutionFixture::KernelExecutionFixture
KernelExecutionFixture(TExtent const &extent)
Definition KernelExecutionFixture.hpp:43

alpaka::test::KernelExecutionFixture::Dim
alpaka::Dim< Acc > Dim
Definition KernelExecutionFixture.hpp:31

alpaka::test::KernelExecutionFixture::operator()
auto operator()(TKernelFnObj kernelFnObj, TArgs &&... args) -> bool
Definition KernelExecutionFixture.hpp:66

alpaka::test::KernelExecutionFixture::Tag
alpaka::AccToTag< Acc > Tag
Definition KernelExecutionFixture.hpp:30

alpaka::test
The test specifics.
Definition TestAccs.hpp:27

alpaka::test::DefaultQueue
typename trait::DefaultQueueType< TDev >::type DefaultQueue
The queue type that should be used for the given device.
Definition Queue.hpp:108

alpaka
The alpaka accelerator library.
Definition AccCpuOmp2Blocks.hpp:52

alpaka::Idx
typename trait::IdxType< T >::type Idx
Definition Traits.hpp:29

alpaka::memcpy
ALPAKA_FN_HOST auto memcpy(TQueue &queue, alpaka::detail::DevGlobalImplGeneric< TTag, TTypeDst > &viewDst, TViewSrc const &viewSrc) -> void
Definition DeviceGlobalCpu.hpp:61

alpaka::getValidWorkDiv
ALPAKA_FN_HOST auto getValidWorkDiv(KernelCfg< TAcc, TGridElemExtent, TThreadElemExtent > const &kernelCfg, TDev const &dev, TKernelFnObj const &kernelFnObj, TArgs &&... args) -> WorkDivMembers< Dim< TAcc >, Idx< TAcc > >
Definition WorkDivHelpers.hpp:362

alpaka::Dev
typename trait::DevType< T >::type Dev
The device type trait alias template to remove the ::type.
Definition Traits.hpp:56

alpaka::getPtrNative
ALPAKA_FN_HOST auto getPtrNative(TView const &view) -> Elem< TView > const *
Gets the native pointer of the memory view.
Definition Traits.hpp:139

alpaka::memset
ALPAKA_FN_HOST auto memset(TQueue &queue, TViewFwd &&view, std::uint8_t const &byte, TExtent const &extent) -> void
Sets the bytes of the memory of view, described by extent, to the given value.
Definition Traits.hpp:252

alpaka::getDevByIdx
ALPAKA_FN_HOST auto getDevByIdx(TPlatform const &platform, std::size_t const &devIdx) -> Dev< TPlatform >
Definition Traits.hpp:62

alpaka::getDev
ALPAKA_FN_HOST auto getDev(T const &t)
Definition Traits.hpp:68

alpaka::wait
ALPAKA_FN_HOST auto wait(TAwaited const &awaited) -> void
Makes the calling thread wait for the completion of the given awaited action.
Definition Traits.hpp:34

alpaka::Platform
typename trait::PlatformType< T >::type Platform
The platform type trait alias template to remove the ::type.
Definition Traits.hpp:51

alpaka::Dim
typename trait::DimType< T >::type Dim
The dimension type trait alias template to remove the ::type.
Definition Traits.hpp:19

alpaka::AccToTag
typename trait::AccToTag< TAcc >::type AccToTag
Maps an accelerator type to its tag type.
Definition Tag.hpp:67

std
STL namespace.

alpaka::KernelCfg
Kernel start configuration to determine a valid work division.
Definition WorkDivHelpers.hpp:320

alpaka::PlatformCpu
The CPU device platform.
Definition PlatformCpu.hpp:18