llama/BitPackedInt_8hpp_source.html

 // Copyright 2023 Bernhard Manfred Gruber

 // SPDX-License-Identifier: MPL-2.0


 #pragma once


 #include "../Core.hpp"

 #include "../ProxyRefOpMixin.hpp"

 #include "Common.hpp"


 #include <climits>

 #include <type_traits>


 namespace llama::mapping

 {

     // Selects how the bit-packed mappings treat the sign of signed integers when packing and unpacking.
     LLAMA_EXPORT

     enum class SignBit

     {

         // The topmost stored bit carries the sign; values are sign-extended when read back.
         Keep,

         // No sign handling: only the low bits are stored and values are read back zero-extended.
         Discard

     };


     namespace internal

     {

         // Returns a value of type Integral whose lowest `bits` bits are set. A request for at least as many bits
         // as Integral holds yields an all-ones mask, which avoids shifting by the full width of the type.
         template<typename Integral>
         LLAMA_FN_HOST_ACC_INLINE constexpr auto makeMask(Integral bits) -> Integral
         {
             if(bits < sizeof(Integral) * CHAR_BIT)
                 return (Integral{1} << bits) - 1u;
             return ~Integral{0};
         }


         // Reads the bitCount-bit wide value that starts bitOffset bits after ptr and returns it as Integral.
         // The value may straddle two adjacent StoredIntegral words: its low part is then taken from the upper
         // bits of the first word and the remainder from the low bits of the following word.
         // If KeepSignBit is set and Integral is signed, the topmost of the bitCount bits is interpreted as the
         // sign and extended over the remaining bits before the final cast.
         // Precondition (asserted): 0 < bitCount <= number of bits in StoredIntegral. ptr is not bounds-checked.
         template<bool KeepSignBit, typename Integral, typename StoredIntegral>
         LLAMA_FN_HOST_ACC_INLINE constexpr auto bitunpack(
             const StoredIntegral* ptr,
             StoredIntegral bitOffset,
             StoredIntegral bitCount) -> Integral
         {
             constexpr auto bitsPerIntegral = static_cast<StoredIntegral>(sizeof(Integral) * CHAR_BIT);
             constexpr auto bitsPerStoredIntegral = static_cast<StoredIntegral>(sizeof(StoredIntegral) * CHAR_BIT);
             static_assert(bitsPerIntegral <= bitsPerStoredIntegral);
             assert(bitCount > 0 && bitCount <= bitsPerStoredIntegral);
 #ifdef __clang__
             // this is necessary to silence the clang static analyzer
             __builtin_assume(bitCount > 0 && bitCount <= bitsPerStoredIntegral);
 #endif

             // locate the word holding the first bit and the position of that bit inside the word
             const auto* word = ptr + bitOffset / bitsPerStoredIntegral;
             const auto shift = bitOffset % bitsPerStoredIntegral;
             const auto endBit = shift + bitCount;

             //            assert(word < endPtr);
             auto result = word[0] >> shift;
             if(endBit > bitsPerStoredIntegral)
             {
                 // the value continues in the next word: append its low bits above the ones already loaded
                 const auto bitsFromFirstWord = bitsPerStoredIntegral - shift;
                 const auto bitsFromSecondWord = endBit - bitsPerStoredIntegral;
                 //                assert(word + 1 < endPtr);
                 result |= (word[1] & makeMask(bitsFromSecondWord)) << bitsFromFirstWord;
             }
             else
             {
                 // the value lies within one word: drop the bits of the neighbouring values above it
                 result &= makeMask(bitCount);
             }

             if constexpr(std::is_signed_v<Integral> && KeepSignBit)
             {
                 // perform sign extension; skipped for full-width values, where a shift by bitCount is not allowed
                 const auto signMask = StoredIntegral{1} << (bitCount - 1);
                 const bool negative = (result & signMask) != 0;
                 if(negative && bitCount < bitsPerStoredIntegral)
                     result |= ~StoredIntegral{0} << bitCount;
             }
             return static_cast<Integral>(result);
         }


         // Stores `value` as a bitCount-bit wide field that starts bitOffset bits after ptr, leaving all other
         // bits of the touched words unchanged. The field may straddle two adjacent StoredIntegral words.
         // If KeepSignBit is set and Integral is signed, the topmost of the bitCount bits stores whether the
         // value is negative and the remaining bitCount - 1 bits store the low bits of the value. Otherwise the
         // low bitCount bits of the value are stored as is.
         // Precondition (asserted): 0 < bitCount <= number of bits in StoredIntegral. ptr is not bounds-checked.
         template<bool KeepSignBit, typename StoredIntegral, typename Integral>
         LLAMA_FN_HOST_ACC_INLINE constexpr void bitpack(
             StoredIntegral* ptr,
             StoredIntegral bitOffset,
             StoredIntegral bitCount,
             Integral value)
         {
             constexpr auto bitsPerIntegral = static_cast<StoredIntegral>(sizeof(Integral) * CHAR_BIT);
             constexpr auto bitsPerStoredIntegral = static_cast<StoredIntegral>(sizeof(StoredIntegral) * CHAR_BIT);
             static_assert(bitsPerIntegral <= bitsPerStoredIntegral);
             assert(bitCount > 0 && bitCount <= bitsPerStoredIntegral);
 #ifdef __clang__
             // this is necessary to silence the clang static analyzer
             __builtin_assume(bitCount > 0 && bitCount <= bitsPerStoredIntegral);
 #endif

             // NOLINTNEXTLINE(bugprone-signed-char-misuse,cert-str34-c)
             const auto unsignedValue = static_cast<StoredIntegral>(value);
             const auto mask = makeMask(bitCount);
             // Value-initialized: before C++20 a constexpr function must not define a variable without
             // initialization, so leaving this uninitialized would rule out constant evaluation.
             StoredIntegral valueBits{};
             if constexpr(std::is_signed_v<Integral> && KeepSignBit)
             {
                 // sign goes into the topmost stored bit, the low bits of the value into the bits below it
                 const auto magnitudeMask = makeMask(bitCount - 1);
                 const auto isSigned = value < 0;
                 valueBits = (StoredIntegral{isSigned} << (bitCount - 1)) | (unsignedValue & magnitudeMask);
             }
             else
             {
                 valueBits = unsignedValue & mask;
             }

             // locate the word holding the first bit and the position of that bit inside the word
             auto* p = ptr + bitOffset / bitsPerStoredIntegral;
             const auto innerBitOffset = bitOffset % bitsPerStoredIntegral;

             {
                 // bits shifted beyond the end of the first word are dropped here and written below
                 const auto clearMask = ~(mask << innerBitOffset);
                 //                assert(p < endPtr);
                 auto mem = p[0] & clearMask; // clear previous bits
                 mem |= valueBits << innerBitOffset; // write new bits
                 p[0] = mem;
             }

             const auto innerBitEndOffset = innerBitOffset + bitCount;
             if(innerBitEndOffset > bitsPerStoredIntegral)
             {
                 // the field continues in the next word: store the remaining high bits in its low bits
                 const auto excessBits = innerBitEndOffset - bitsPerStoredIntegral;
                 const auto bitsWritten = bitsPerStoredIntegral - innerBitOffset;
                 const auto clearMask = ~makeMask(excessBits);
                 //                assert(p + 1 < endPtr);
                 auto mem = p[1] & clearMask; // clear previous bits
                 mem |= valueBits >> bitsWritten; // write new bits
                 p[1] = mem;
             }
         }


         // Single-bit read: returns the bit located bitOffset bits after ptr (0 or 1), converted to Integral.
         // No sign handling is performed.
         template<typename Integral, typename StoredIntegral>
         LLAMA_FN_HOST_ACC_INLINE constexpr auto bitunpack1(const StoredIntegral* ptr, StoredIntegral bitOffset)
             -> Integral
         {
             constexpr auto bitsPerStoredIntegral = static_cast<StoredIntegral>(sizeof(StoredIntegral) * CHAR_BIT);
             const auto& word = ptr[bitOffset / bitsPerStoredIntegral];
             const auto shift = bitOffset % bitsPerStoredIntegral;
             return static_cast<Integral>((word >> shift) & StoredIntegral{1});
         }


         // Single-bit write: stores the lowest bit of `value` at the position bitOffset bits after ptr and leaves
         // every other bit of the touched word unchanged. No sign handling is performed.
         template<typename StoredIntegral, typename Integral>
         LLAMA_FN_HOST_ACC_INLINE constexpr void bitpack1(StoredIntegral* ptr, StoredIntegral bitOffset, Integral value)
         {
             constexpr auto bitsPerStoredIntegral = static_cast<StoredIntegral>(sizeof(StoredIntegral) * CHAR_BIT);
             const auto shift = bitOffset % bitsPerStoredIntegral;
             const auto newBit = static_cast<StoredIntegral>(value) & StoredIntegral{1};
             auto& word = ptr[bitOffset / bitsPerStoredIntegral];
             // clear the target bit, then merge in the new one
             word = (word & ~(StoredIntegral{1} << shift)) | (newBit << shift);
         }


         // Proxy reference to one bit-packed integer inside an array of StoredIntegral words.
         // Converting the proxy to Integral unpacks the value; assigning an Integral packs it back into the
         // words. The number of bits per value is provided by the VHBits base via VHBits::value(). When VHBits
         // is an empty type with a compile-time value of 1 and no sign handling is needed, single-bit fast
         // paths are used. ProxyRefOpMixin is inherited for its operator support on top of these two
         // operations.
         template<typename Integral, typename StoredIntegralCV, typename VHBits, typename SizeType, SignBit SignBit>
         // NOLINTNEXTLINE(cppcoreguidelines-special-member-functions,hicpp-special-member-functions)
         struct BitPackedIntRef
             : private VHBits
             , ProxyRefOpMixin<BitPackedIntRef<Integral, StoredIntegralCV, VHBits, SizeType, SignBit>, Integral>
         {
         private:
             using StoredIntegral = std::remove_cv_t<StoredIntegralCV>;
             StoredIntegralCV* ptr; // first storage word of the packed array
             SizeType bitOffset; // position of the referenced value, in bits from ptr

         public:
             using value_type = Integral;

             // Creates a proxy for the value located bitOffset bits after ptr, with its bit count taken from vhBits.
             LLAMA_FN_HOST_ACC_INLINE constexpr BitPackedIntRef(
                 StoredIntegralCV* ptr,
                 SizeType bitOffset,
                 VHBits vhBits)
                 : VHBits{vhBits}
                 , ptr{ptr}
                 , bitOffset{bitOffset}
             {
             }

             BitPackedIntRef(const BitPackedIntRef&) = default;

             // Assigns the value referenced by `other` to the value referenced by this proxy. The proxy itself is
             // not rebound.
             // NOLINTNEXTLINE(bugprone-unhandled-self-assignment,cert-oop54-cpp)
             LLAMA_FN_HOST_ACC_INLINE constexpr auto operator=(const BitPackedIntRef& other) -> BitPackedIntRef&
             {
                 *this = static_cast<value_type>(other);
                 return *this;
             }

             // Unpacks and returns the referenced value.
             // NOLINTNEXTLINE(google-explicit-constructor,hicpp-explicit-conversions)
             LLAMA_FN_HOST_ACC_INLINE constexpr operator Integral() const
             {
                 // fast path for single bits without sign handling
                 if constexpr(std::is_empty_v<VHBits>)
                 {
                     if constexpr(VHBits::value() == 1 && (std::is_unsigned_v<Integral> || SignBit == SignBit::Discard))
                     {
                         return bitunpack1<Integral>(ptr, static_cast<StoredIntegral>(bitOffset));
                     }
                 }

                 return bitunpack<SignBit == SignBit::Keep, Integral>(
                     ptr,
                     static_cast<StoredIntegral>(bitOffset),
                     static_cast<StoredIntegral>(VHBits::value()));
             }

             // Packs `value` into the referenced bits and returns this proxy.
             LLAMA_FN_HOST_ACC_INLINE constexpr auto operator=(Integral value) -> BitPackedIntRef&
             {
                 // fast path for single bits without sign handling
                 if constexpr(std::is_empty_v<VHBits>)
                 {
                     if constexpr(VHBits::value() == 1 && (std::is_unsigned_v<Integral> || SignBit == SignBit::Discard))
                     {
                         bitpack1(ptr, static_cast<StoredIntegral>(bitOffset), value);
                         // done: without this return the general bitpack below would store the same bit again
                         return *this;
                     }
                 }

                 bitpack<SignBit == SignBit::Keep>(
                     ptr,
                     static_cast<StoredIntegral>(bitOffset),
                     static_cast<StoredIntegral>(VHBits::value()),
                     value);
                 return *this;
             }
         };


         // Ordering predicate handed to mp_max_element below: true when A occupies fewer bytes than B.
         template<typename A, typename B>

         using HasLargerSize = mp_bool<sizeof(A) < sizeof(B)>;


         // The element of the flattened record dimension picked by mp_max_element under HasLargerSize, i.e.
         // (assuming Boost.Mp11 semantics) a leaf field type with the largest sizeof.
         template<typename RecordDim>

         using LargestIntegral = mp_max_element<FlatRecordDim<RecordDim>, HasLargerSize>;


         // Default storage word type for a record dimension: std::uint64_t if LargestIntegral is larger than
         // std::uint32_t, otherwise std::uint32_t.
         template<typename RecordDim>

         using StoredUnsignedFor = std::

             conditional_t<(sizeof(LargestIntegral<RecordDim>) > sizeof(std::uint32_t)), std::uint64_t, std::uint32_t>;


         // Common base of the bit-packed integer mappings. Holds the array extents (through MappingBase) and the
         // number of bits per stored value (through BoxedValue<Bits>), and validates the configuration:
         //  - the storage word type must be std::uint32_t or std::uint64_t,
         //  - every leaf field of the record dimension must be an integral or enum type no larger than the
         //    storage word,
         //  - the bit count must be greater than zero, must not exceed the bit width of any field type, and must
         //    be at least 2 if a signed field is stored with SignBit::Keep.
         // With a compile-time bit count these constraints are static_asserts; with a runtime bit count they
         // throw std::invalid_argument on the host and are asserts when compiled for a CUDA device.
         template<
             typename TArrayExtents,
             typename TRecordDim,
             typename Bits,
             SignBit SignBit,
             typename TLinearizeArrayIndexFunctor,
             typename TStoredIntegral>
         struct BitPackedIntCommon
             : MappingBase<TArrayExtents, TRecordDim>
             , protected llama::internal::BoxedValue<Bits>
         {
             using LinearizeArrayIndexFunctor = TLinearizeArrayIndexFunctor;
             using StoredIntegral = TStoredIntegral;

             static_assert(std::is_integral_v<StoredIntegral>);
             static_assert(std::is_unsigned_v<StoredIntegral>);

             // We could allow more integer types as storage type, but that needs to be thought through carefully
             static_assert(
                 std::is_same_v<StoredIntegral, std::uint32_t> || std::is_same_v<StoredIntegral, std::uint64_t>);

         protected:
             using Base = MappingBase<TArrayExtents, TRecordDim>;
             using VHBits = llama::internal::BoxedValue<Bits>;
             using size_type = typename TArrayExtents::value_type;

             template<typename T>
             using IsAllowedFieldType = mp_or<std::is_integral<T>, std::is_enum<T>>;

             static_assert(
                 mp_all_of<FlatRecordDim<TRecordDim>, IsAllowedFieldType>::value,
                 "All record dimension field types must be integral");

             template<typename T>
             using IsFieldTypeSmallerOrEqualStorageIntegral = mp_bool<sizeof(T) <= sizeof(StoredIntegral)>;

             static_assert(
                 mp_all_of<FlatRecordDim<TRecordDim>, IsFieldTypeSmallerOrEqualStorageIntegral>::value,
                 "The integral type used for storage must be at least as big as the type of the values to retrieve");

         public:
             // Returns the number of bits used to store each value.
             LLAMA_FN_HOST_ACC_INLINE
             constexpr auto bits() const -> size_type
             {
                 return static_cast<size_type>(VHBits::value());
             }

             // Constructor for a compile-time bit count (isConstant<Bits>). All constraints on the bit count are
             // checked with static_asserts, once per leaf field type.
             template<typename B = Bits, std::enable_if_t<isConstant<B>, int> = 0>
             LLAMA_FN_HOST_ACC_INLINE constexpr explicit BitPackedIntCommon(
                 TArrayExtents extents = {},
                 Bits bits = {},
                 TRecordDim = {})
                 : Base(extents)
                 , VHBits{bits}
             {
                 static_assert(VHBits::value() > 0);
                 mp_for_each_inline<mp_transform<mp_identity, FlatRecordDim<TRecordDim>>>(
                     [&](auto t)
                     {
                         using FieldType = typename decltype(t)::type;
                         static_assert(
                             static_cast<std::size_t>(VHBits::value()) <= sizeof(FieldType) * CHAR_BIT,
                             "Storage bits must not be greater than bits of field type");
                         static_assert(
                             VHBits::value() >= 2
                                 || std::is_unsigned_v<FieldType> || SignBit == llama::mapping::SignBit::Discard,
                             "When keeping the sign bit, Bits must be at least 2 with signed integers in the record "
                             "dimension");
                     });
             }

             // Constructor for a runtime bit count. On the host, a violated constraint throws
             // std::invalid_argument; when compiled for a CUDA device the same constraints are asserts.
             template<typename B = Bits, std::enable_if_t<!isConstant<B>, int> = 0>
             LLAMA_FN_HOST_ACC_INLINE constexpr explicit BitPackedIntCommon(
                 TArrayExtents extents,
                 Bits bits,
                 TRecordDim = {})
                 : Base(extents)
                 , VHBits{bits}
             {
 #ifdef __CUDA_ARCH__
                 assert(VHBits::value() > 0);
 #else
                 if(VHBits::value() <= 0)
                     throw std::invalid_argument("BitPackedInt* Bits must not be zero");
 #endif
                 mp_for_each_inline<mp_transform<mp_identity, FlatRecordDim<TRecordDim>>>(
                     [&](auto t)
                     {
                         using FieldType [[maybe_unused]] = typename decltype(t)::type;
 #ifdef __CUDA_ARCH__
                         assert(static_cast<std::size_t>(VHBits::value()) <= sizeof(FieldType) * CHAR_BIT);
                         // same sign-bit constraint as enforced on the host below
                         assert(
                             VHBits::value() >= 2
                             || std::is_unsigned_v<FieldType> || SignBit == llama::mapping::SignBit::Discard);
 #else
                         if(static_cast<std::size_t>(VHBits::value()) > sizeof(FieldType) * CHAR_BIT)
                             throw std::invalid_argument(
                                 "BitPackedInt* Bits must not be larger than any field type in the record dimension");
                         if(!(VHBits::value() >= 2
                              || std::is_unsigned_v<FieldType> || SignBit == llama::mapping::SignBit::Discard))
                             throw std::invalid_argument("When keeping the sign bit, Bits must be at least 2 with "
                                                         "signed integers in the record "
                                                         "dimension");
 #endif
                     });
             }

             // Every field of this mapping is computed: access goes through a proxy reference instead of a
             // plain memory reference.
             template<std::size_t... RecordCoords>
             static constexpr auto isComputed(RecordCoord<RecordCoords...>)
             {
                 return true;
             }
         };

     } // namespace internal


     // Struct-of-arrays flavour of the bit-packed integer mapping: each leaf field of the record dimension gets
     // its own blob, in which the values of all array elements are stored back to back using VHBits::value()
     // bits each. Values are accessed through internal::BitPackedIntRef proxy references.
     LLAMA_EXPORT
     template<
         typename TArrayExtents,
         typename TRecordDim,
         typename Bits = typename TArrayExtents::value_type,
         SignBit SignBit = SignBit::Keep,
         typename TLinearizeArrayIndexFunctor = LinearizeArrayIndexRight,
         typename TStoredIntegral = internal::StoredUnsignedFor<TRecordDim>>
     struct BitPackedIntSoA
         : internal::BitPackedIntCommon<
               TArrayExtents,
               TRecordDim,
               Bits,
               SignBit,
               TLinearizeArrayIndexFunctor,
               TStoredIntegral>
     {
     private:
         using Base = internal::
             BitPackedIntCommon<TArrayExtents, TRecordDim, Bits, SignBit, TLinearizeArrayIndexFunctor, TStoredIntegral>;

     public:
         using Base::Base;
         using typename Base::size_type;
         using VHBits = typename Base::VHBits; // use plain using declaration with nvcc >= 11.8

         // one blob per leaf field of the record dimension
         static constexpr std::size_t blobCount = mp_size<FlatRecordDim<TRecordDim>>::value;

         // Returns the size of a blob in bytes (identical for every blob): the bits needed for all array
         // elements, rounded up to a whole number of storage words.
         LLAMA_FN_HOST_ACC_INLINE
         constexpr auto blobSize(size_type /*blobIndex*/) const -> size_type
         {
             constexpr auto bitsPerStoredIntegral = static_cast<size_type>(sizeof(TStoredIntegral) * CHAR_BIT);
             // the bit count is converted to size_type first, as in BitPackedIntAoS, so a differently typed
             // Bits does not change the type of the product
             const auto bitsNeeded
                 = TLinearizeArrayIndexFunctor{}.size(Base::extents()) * static_cast<size_type>(VHBits::value());
             return roundUpToMultiple(bitsNeeded, bitsPerStoredIntegral) / CHAR_BIT;
         }

         // Returns a proxy reference to the value of the field selected by the record coordinate at array
         // index ai. The field's flat index selects the blob; the linearized array index times the bit count
         // gives the bit offset inside that blob.
         template<std::size_t... RecordCoords, typename Blobs>
         LLAMA_FN_HOST_ACC_INLINE constexpr auto compute(
             typename Base::ArrayIndex ai,
             RecordCoord<RecordCoords...>,
             Blobs& blobs) const
         {
             constexpr auto blob = flatRecordCoord<TRecordDim, RecordCoord<RecordCoords...>>;
             const auto bitOffset
                 = TLinearizeArrayIndexFunctor{}(ai, Base::extents()) * static_cast<size_type>(VHBits::value());

             using QualifiedStoredIntegral = CopyConst<Blobs, TStoredIntegral>;
             using DstType = GetType<TRecordDim, RecordCoord<RecordCoords...>>;
             LLAMA_BEGIN_SUPPRESS_HOST_DEVICE_WARNING
             return internal::BitPackedIntRef<DstType, QualifiedStoredIntegral, VHBits, size_type, SignBit>{
                 reinterpret_cast<QualifiedStoredIntegral*>(&blobs[blob][0]),
                 bitOffset,
                 static_cast<const VHBits&>(*this)};
             LLAMA_END_SUPPRESS_HOST_DEVICE_WARNING
         }
     };


     // Binds all template arguments of BitPackedIntSoA except the array extents and the record dimension; the
     // nested alias `fn` supplies those two. Passing void for Bits or StoredIntegral selects the same default
     // that BitPackedIntSoA itself uses for that parameter.
     LLAMA_EXPORT
     template<
         typename Bits = void,
         SignBit SignBit = SignBit::Keep,
         typename LinearizeArrayIndexFunctor = mapping::LinearizeArrayIndexRight,
         typename StoredIntegral = void>
     struct BindBitPackedIntSoA
     {
         template<typename ArrayExtents, typename RecordDim>
         using fn = BitPackedIntSoA<
             ArrayExtents,
             RecordDim,
             std::conditional_t<std::is_void_v<Bits>, typename ArrayExtents::value_type, Bits>,
             SignBit,
             LinearizeArrayIndexFunctor,
             std::conditional_t<std::is_void_v<StoredIntegral>, internal::StoredUnsignedFor<RecordDim>, StoredIntegral>>;
     };


     // Trait variable: true if Mapping is an instantiation of BitPackedIntSoA, false for any other type.
     LLAMA_EXPORT

     template<typename Mapping>

     inline constexpr bool isBitPackedIntSoA = false;


     // Partial specialization matching every instantiation of BitPackedIntSoA.
     LLAMA_EXPORT

     template<

         typename ArrayExtents,

         typename RecordDim,

         typename Bits,

         SignBit SignBit,

         typename LinearizeArrayIndexFunctor,

         typename StoredIntegral>

     inline constexpr bool isBitPackedIntSoA<

         BitPackedIntSoA<ArrayExtents, RecordDim, Bits, SignBit, LinearizeArrayIndexFunctor, StoredIntegral>>

         = true;


     // Array-of-structs flavour of the bit-packed integer mapping: all values live in a single blob. The
     // fields of one record are stored next to each other, each occupying VHBits::value() bits, and records
     // follow each other in the order given by the linearized array index.
     // PermuteFields determines the slot each field takes within a record. See \ref PermuteFieldsInOrder,
     // \ref PermuteFieldsIncreasingAlignment, \ref PermuteFieldsDecreasingAlignment and
     // \ref PermuteFieldsMinimizePadding.
     LLAMA_EXPORT
     template<
         typename TArrayExtents,
         typename TRecordDim,
         typename Bits = typename TArrayExtents::value_type,
         SignBit SignBit = SignBit::Keep,
         typename TLinearizeArrayIndexFunctor = LinearizeArrayIndexRight,
         template<typename> typename PermuteFields = PermuteFieldsInOrder,
         typename TStoredIntegral = internal::StoredUnsignedFor<TRecordDim>>
     struct BitPackedIntAoS
         : internal::BitPackedIntCommon<
               TArrayExtents,
               TRecordDim,
               Bits,
               SignBit,
               TLinearizeArrayIndexFunctor,
               TStoredIntegral>
     {
     private:
         using Base = internal::
             BitPackedIntCommon<TArrayExtents, TRecordDim, Bits, SignBit, TLinearizeArrayIndexFunctor, TStoredIntegral>;

     public:
         using Base::Base;
         using typename Base::size_type;
         using VHBits = typename Base::VHBits; // use plain using declaration with nvcc >= 11.8

         using Permuter = PermuteFields<TRecordDim>;
         static constexpr std::size_t blobCount = 1; // everything is stored in one blob

         // Returns the size of the blob in bytes: the bits needed for every field of every record, rounded up
         // to a whole number of storage words.
         LLAMA_FN_HOST_ACC_INLINE
         constexpr auto blobSize(size_type /*blobIndex*/) const -> size_type
         {
             constexpr auto bitsPerWord = static_cast<size_type>(sizeof(TStoredIntegral) * CHAR_BIT);
             const auto recordCount = TLinearizeArrayIndexFunctor{}.size(Base::extents());
             const auto totalBits = recordCount * static_cast<size_type>(VHBits::value())
                 * static_cast<size_type>(flatFieldCount<TRecordDim>);
             return roundUpToMultiple(totalBits, bitsPerWord) / CHAR_BIT;
         }

         // Returns a proxy reference to the value of the field selected by the record coordinate at array
         // index ai. The bit offset is (record index * fields per record + permuted field slot) * bits per value.
         template<std::size_t... RecordCoords, typename Blobs>
         LLAMA_FN_HOST_ACC_INLINE constexpr auto compute(
             typename Base::ArrayIndex ai,
             RecordCoord<RecordCoords...>,
             Blobs& blobs) const
         {
             // slot of the requested field inside a record, after permutation
             constexpr auto fieldSlot = static_cast<size_type>(
                 Permuter::template permute<flatRecordCoord<TRecordDim, RecordCoord<RecordCoords...>>>);
             const auto recordIndex = TLinearizeArrayIndexFunctor{}(ai, Base::extents());
             const auto valueIndex = (recordIndex * static_cast<size_type>(flatFieldCount<TRecordDim>)) + fieldSlot;
             const auto bitOffset = valueIndex * static_cast<size_type>(VHBits::value());

             using Word = CopyConst<Blobs, TStoredIntegral>;
             using FieldType = GetType<TRecordDim, RecordCoord<RecordCoords...>>;
             using Ref = internal::BitPackedIntRef<FieldType, Word, VHBits, size_type, SignBit>;
             LLAMA_BEGIN_SUPPRESS_HOST_DEVICE_WARNING
             return Ref{reinterpret_cast<Word*>(&blobs[0][0]), bitOffset, static_cast<const VHBits&>(*this)};
             LLAMA_END_SUPPRESS_HOST_DEVICE_WARNING
         }
     };


     // Binds all template arguments of BitPackedIntAoS except the array extents and the record dimension; the
     // nested alias `fn` supplies those two. Passing void for Bits or StoredIntegral selects the same default
     // that BitPackedIntAoS itself uses for that parameter.
     LLAMA_EXPORT
     template<
         typename Bits = void,
         SignBit SignBit = SignBit::Keep,
         typename LinearizeArrayIndexFunctor = mapping::LinearizeArrayIndexRight,
         template<typename> typename PermuteFields = PermuteFieldsInOrder,
         typename StoredIntegral = void>
     struct BindBitPackedIntAoS
     {
         template<typename ArrayExtents, typename RecordDim>
         using fn = BitPackedIntAoS<
             ArrayExtents,
             RecordDim,
             std::conditional_t<std::is_void_v<Bits>, typename ArrayExtents::value_type, Bits>,
             SignBit,
             LinearizeArrayIndexFunctor,
             PermuteFields,
             std::conditional_t<std::is_void_v<StoredIntegral>, internal::StoredUnsignedFor<RecordDim>, StoredIntegral>>;
     };


     // Trait variable: true if Mapping is an instantiation of BitPackedIntAoS, false for any other type.
     LLAMA_EXPORT

     template<typename Mapping>

     inline constexpr bool isBitPackedIntAoS = false;


     // Partial specialization matching every instantiation of BitPackedIntAoS.
     template<

         typename ArrayExtents,

         typename RecordDim,

         typename Bits,

         SignBit SignBit,

         typename LinearizeArrayIndexFunctor,

         template<typename>

         typename PermuteFields,

         typename StoredIntegral>

     inline constexpr bool isBitPackedIntAoS<BitPackedIntAoS<

         ArrayExtents,

         RecordDim,

         Bits,

         SignBit,

         LinearizeArrayIndexFunctor,

         PermuteFields,

         StoredIntegral>>

         = true;

 } // namespace llama::mapping

Common.hpp

LLAMA_EXPORT
#define LLAMA_EXPORT
Definition: macros.hpp:192

LLAMA_BEGIN_SUPPRESS_HOST_DEVICE_WARNING
#define LLAMA_BEGIN_SUPPRESS_HOST_DEVICE_WARNING
Definition: macros.hpp:141

LLAMA_FN_HOST_ACC_INLINE
#define LLAMA_FN_HOST_ACC_INLINE
Definition: macros.hpp:96

LLAMA_END_SUPPRESS_HOST_DEVICE_WARNING
#define LLAMA_END_SUPPRESS_HOST_DEVICE_WARNING
Definition: macros.hpp:153

llama::mapping::internal::bitunpack1
constexpr auto bitunpack1(const StoredIntegral *ptr, StoredIntegral bitOffset) -> Integral
Definition: BitPackedInt.hpp:129

llama::mapping::internal::makeMask
constexpr auto makeMask(Integral bits) -> Integral
Definition: BitPackedInt.hpp:25

llama::mapping::internal::bitpack1
constexpr void bitpack1(StoredIntegral *ptr, StoredIntegral bitOffset, Integral value)
Definition: BitPackedInt.hpp:139

llama::mapping::internal::StoredUnsignedFor
std::conditional_t<(sizeof(LargestIntegral< RecordDim >) > sizeof(std::uint32_t)), std::uint64_t, std::uint32_t > StoredUnsignedFor
Definition: BitPackedInt.hpp:233

llama::mapping::internal::bitunpack
constexpr auto bitunpack(const StoredIntegral *ptr, StoredIntegral bitOffset, StoredIntegral bitCount) -> Integral
Definition: BitPackedInt.hpp:31

llama::mapping::internal::bitpack
constexpr void bitpack(StoredIntegral *ptr, StoredIntegral bitOffset, StoredIntegral bitCount, Integral value)
Definition: BitPackedInt.hpp:74

llama::mapping::internal::HasLargerSize
mp_bool< sizeof(A)< sizeof(B)> HasLargerSize
Definition: BitPackedInt.hpp:226

llama::mapping::internal::LargestIntegral
mp_max_element< FlatRecordDim< RecordDim >, HasLargerSize > LargestIntegral
Definition: BitPackedInt.hpp:229

llama::mapping
Definition: AoS.hpp:9

llama::mapping::isBitPackedIntAoS
constexpr bool isBitPackedIntAoS
Definition: BitPackedInt.hpp:557

llama::mapping::isBitPackedIntSoA
constexpr bool isBitPackedIntSoA
Definition: BitPackedInt.hpp:439

llama::mapping::Blobs
Blobs
Definition: SoA.hpp:14

llama::mapping::SignBit
SignBit
Definition: BitPackedInt.hpp:17

llama::mapping::SignBit::Keep
@ Keep

llama::mapping::SignBit::Discard
@ Discard

llama::FlatRecordDim
typename internal::FlattenRecordDimImpl< RecordDim >::type FlatRecordDim
Returns a flat type list containing all leaf field types of the given record dimension.
Definition: Core.hpp:481

llama::ArrayExtents
ArrayExtents(Args...) -> ArrayExtents< typename internal::IndexTypeFromArgs< std::size_t, Args... >::type,(Args{}, dyn)... >

llama::flatRecordCoord
constexpr std::size_t flatRecordCoord
Definition: Core.hpp:517

llama::CopyConst
std::conditional_t< std::is_const_v< FromT >, const ToT, ToT > CopyConst
Alias for ToT, adding const if FromT is const qualified.
Definition: Core.hpp:824

llama::roundUpToMultiple
constexpr auto roundUpToMultiple(Integral n, Integral mult) -> Integral
Returns the integral n rounded up to be a multiple of mult.
Definition: Core.hpp:578

llama::GetType
typename internal::GetTypeImpl< RecordDim, RecordCoordOrTags... >::type GetType
Definition: Core.hpp:388

llama::ArrayExtents::value_type
T value_type
Definition: ArrayExtents.hpp:141

llama::ProxyRefOpMixin
CRTP mixin for proxy reference types to support all compound assignment and increment/decrement opera...
Definition: ProxyRefOpMixin.hpp:14

llama::RecordCoord
Definition: RecordCoord.hpp:20

llama::internal::BoxedValue
Definition: Core.hpp:855

llama::internal::BoxedValue< Bits >::value
constexpr auto value() const
Definition: Core.hpp:864

llama::mapping::BindBitPackedIntAoS
Definition: BitPackedInt.hpp:540

llama::mapping::BindBitPackedIntSoA
Definition: BitPackedInt.hpp:423

llama::mapping::BitPackedIntAoS
Definition: BitPackedInt.hpp:484

llama::mapping::BitPackedIntAoS::blobCount
static constexpr std::size_t blobCount
Definition: BitPackedInt.hpp:495

llama::mapping::BitPackedIntAoS::compute
constexpr auto compute(typename Base::ArrayIndex ai, RecordCoord< RecordCoords... >, Blobs &blobs) const
Definition: BitPackedInt.hpp:507

llama::mapping::BitPackedIntAoS::Permuter
PermuteFields< TRecordDim > Permuter
Definition: BitPackedInt.hpp:494

llama::mapping::BitPackedIntAoS::VHBits
typename Base::VHBits VHBits
Definition: BitPackedInt.hpp:492

llama::mapping::BitPackedIntAoS::blobSize
constexpr auto blobSize(size_type) const -> size_type
Definition: BitPackedInt.hpp:498

llama::mapping::BitPackedIntSoA
Definition: BitPackedInt.hpp:374

llama::mapping::BitPackedIntSoA::VHBits
typename Base::VHBits VHBits
Definition: BitPackedInt.hpp:382

llama::mapping::BitPackedIntSoA::compute
constexpr auto compute(typename Base::ArrayIndex ai, RecordCoord< RecordCoords... >, Blobs &blobs) const
Definition: BitPackedInt.hpp:395

llama::mapping::BitPackedIntSoA::blobCount
static constexpr std::size_t blobCount
Definition: BitPackedInt.hpp:384

llama::mapping::BitPackedIntSoA::blobSize
constexpr auto blobSize(size_type) const -> size_type
Definition: BitPackedInt.hpp:387

llama::mapping::LinearizeArrayIndexRight
Definition: Common.hpp:46

llama::mapping::MappingBase
Definition: Common.hpp:19

llama::mapping::MappingBase::size_type
typename ArrayExtents::value_type size_type
Definition: Common.hpp:25

llama::mapping::MappingBase::ArrayIndex
typename ArrayExtents::Index ArrayIndex
Definition: Common.hpp:24

llama::mapping::MappingBase::extents
constexpr auto extents() const -> ArrayExtents
Definition: Common.hpp:35

llama::mapping::PermuteFieldsInOrder
Retains the order of the record dimension's fields.
Definition: Common.hpp:182

llama::mapping::internal::BitPackedIntCommon
Definition: BitPackedInt.hpp:245

llama::mapping::internal::BitPackedIntCommon::BitPackedIntCommon
constexpr BitPackedIntCommon(TArrayExtents extents, Bits bits, TRecordDim={})
Definition: BitPackedInt.hpp:307

llama::mapping::internal::BitPackedIntCommon::Base
MappingBase< TArrayExtents, TRecordDim > Base
Definition: BitPackedInt.hpp:257

llama::mapping::internal::BitPackedIntCommon::size_type
typename TArrayExtents::value_type size_type
Definition: BitPackedInt.hpp:259

llama::mapping::internal::BitPackedIntCommon::BitPackedIntCommon
constexpr BitPackedIntCommon(TArrayExtents extents={}, Bits bits={}, TRecordDim={})
Definition: BitPackedInt.hpp:283

llama::mapping::internal::BitPackedIntCommon::IsAllowedFieldType
mp_or< std::is_integral< T >, std::is_enum< T > > IsAllowedFieldType
Definition: BitPackedInt.hpp:262

llama::mapping::internal::BitPackedIntCommon::LinearizeArrayIndexFunctor
TLinearizeArrayIndexFunctor LinearizeArrayIndexFunctor
Definition: BitPackedInt.hpp:246

llama::mapping::internal::BitPackedIntCommon::IsFieldTypeSmallerOrEqualStorageIntegral
mp_bool< sizeof(T)<=sizeof(StoredIntegral)> IsFieldTypeSmallerOrEqualStorageIntegral
Definition: BitPackedInt.hpp:269

llama::mapping::internal::BitPackedIntCommon::isComputed
static constexpr auto isComputed(RecordCoord< RecordCoords... >)
Definition: BitPackedInt.hpp:340

llama::mapping::internal::BitPackedIntCommon::VHBits
llama::internal::BoxedValue< Bits > VHBits
Definition: BitPackedInt.hpp:258

llama::mapping::internal::BitPackedIntCommon::StoredIntegral
TStoredIntegral StoredIntegral
Definition: BitPackedInt.hpp:247

llama::mapping::internal::BitPackedIntCommon::bits
constexpr auto bits() const -> size_type
Definition: BitPackedInt.hpp:277

llama::mapping::internal::BitPackedIntRef
Definition: BitPackedInt.hpp:159

llama::mapping::internal::BitPackedIntRef::value_type
Integral value_type
Definition: BitPackedInt.hpp:166

llama::mapping::internal::BitPackedIntRef::BitPackedIntRef
BitPackedIntRef(const BitPackedIntRef &)=default

llama::mapping::internal::BitPackedIntRef::operator=
constexpr auto operator=(Integral value) -> BitPackedIntRef &
Definition: BitPackedInt.hpp:205

llama::mapping::internal::BitPackedIntRef::BitPackedIntRef
constexpr BitPackedIntRef(StoredIntegralCV *ptr, SizeType bitOffset, VHBits vhBits)
Definition: BitPackedInt.hpp:168

llama::mapping::internal::BitPackedIntRef::operator=
constexpr auto operator=(const BitPackedIntRef &other) -> BitPackedIntRef &
Definition: BitPackedInt.hpp:181