DNDSR/doxygen/ArrayEigenMatrixBatch__DeviceView_8hpp_source.html

#pragma once

/// @file ArrayEigenMatrixBatch_DeviceView.hpp

/// @brief Device-callable views and on-buffer matrix-batch helpers for

/// @ref DNDS::ArrayEigenMatrixBatch "ArrayEigenMatrixBatch" (variable-sized matrix batches per row).

///

/// Also defines a `MatrixBatch<real_T>` utility class that packs multiple
/// variable-shaped matrices into a single flat buffer, storing one 64-bit
/// header word per matrix (16-bit row count, 16-bit column count, 32-bit data
/// offset) so each row can self-describe its matrix shapes.


#include "../DeviceView.hpp"

#include "DNDS/Defines.hpp"

#include "DNDS/DeviceStorage.hpp"

#include "Eigen/src/Core/Matrix.h"

#include "Eigen/src/Core/util/Constants.h"

#include <cstddef>

#include <type_traits>


namespace DNDS

{

    /**

     * @brief Packed variable-shape matrix-batch layout inside a flat buffer.

     *

     * @details Each row of @ref DNDS::ArrayEigenMatrixBatch "ArrayEigenMatrixBatch" stores several matrices whose

     * shapes may differ. @ref DNDS::MatrixBatch "MatrixBatch" provides:

     *  - nested @ref DNDS::UInt32PairIn64 "UInt32PairIn64" / @ref DNDS::UInt16QuadIn64 "UInt16QuadIn64" helpers to pack two 32-bit

     *    (or four 16-bit) integers into a single 64-bit word (matrix shape headers);

     *  - size computation (`getBufSize`) and compression (@ref CompressIn) for

     *    an input vector of Eigen matrices;

     *  - `operator()(j)` that returns an `Eigen::Map` onto the `j`-th matrix

     *    inside the already-compressed row buffer.

     *

     * The templated `real_T` allows both mutable and const variants.

     */

    template <class real_T = real>


    class MatrixBatch

    {

    public:


        struct UInt32PairIn64

        {

            uint64_t data;

            DNDS_DEVICE_CALLABLE [[nodiscard]] uint32_t getM() const { return uint32_t(data & 0x00000000FFFFFFFFULL); }

            DNDS_DEVICE_CALLABLE [[nodiscard]] uint32_t getN() const { return uint32_t(data >> 32); }

            DNDS_DEVICE_CALLABLE void setM(uint32_t v) { data = (data & 0xFFFFFFFF00000000ULL) | uint64_t(v); }

            DNDS_DEVICE_CALLABLE void setN(uint32_t v) { data = (data & 0x00000000FFFFFFFFULL) | (uint64_t(v) << 32); }

        };


        static_assert(sizeof(UInt32PairIn64) == 8);


        struct UInt16QuadIn64

        {

            uint64_t data;

            DNDS_DEVICE_CALLABLE [[nodiscard]] uint16_t getA() const { return uint16_t((data & 0x000000000000FFFFULL) >> 0); }

            DNDS_DEVICE_CALLABLE [[nodiscard]] uint16_t getB() const { return uint16_t((data & 0x00000000FFFF0000ULL) >> 16); }

            DNDS_DEVICE_CALLABLE [[nodiscard]] uint16_t getC() const { return uint16_t((data & 0x0000FFFF00000000ULL) >> 32); }

            DNDS_DEVICE_CALLABLE [[nodiscard]] uint16_t getD() const { return uint16_t((data & 0xFFFF000000000000ULL) >> 48); }


            DNDS_DEVICE_CALLABLE void setA(uint16_t v) { data = (data & (~0x000000000000FFFFULL)) | (uint64_t(v) << 0); }

            DNDS_DEVICE_CALLABLE void setB(uint16_t v) { data = (data & (~0x00000000FFFF0000ULL)) | (uint64_t(v) << 16); }

            DNDS_DEVICE_CALLABLE void setC(uint16_t v) { data = (data & (~0x0000FFFF00000000ULL)) | (uint64_t(v) << 32); }

            DNDS_DEVICE_CALLABLE void setD(uint16_t v) { data = (data & (~0xFFFF000000000000ULL)) | (uint64_t(v) << 48); }

        };


        static_assert(sizeof(UInt32PairIn64) == 8 && sizeof(UInt16QuadIn64) == 8);


        using t_matrix = Eigen::Matrix<std::remove_cv_t<real_T>, Eigen::Dynamic, Eigen::Dynamic>;

        using t_map_const = Eigen::Map<const t_matrix, Eigen::Unaligned>;

        using t_map =

            std::conditional_t<std::is_const_v<real_T>,

                               t_map_const,

                               Eigen::Map<t_matrix, Eigen::Unaligned>>;


        template <class t_matrices_elem>


        static rowsize getBufSize(const std::vector<t_matrices_elem> &matrices)

        {

            DNDS_assert(matrices.size() < DNDS_ROWSIZE_MAX);

            rowsize bufSiz = matrices.size() + 1;

            for (const auto &i : matrices)

            {

                Eigen::Index mSiz = i.rows() * i.cols();

                static_assert(std::numeric_limits<Eigen::Index>::digits > std::numeric_limits<uint32_t>::digits);

                DNDS_assert((mSiz + bufSiz) < DNDS_ROWSIZE_MAX && i.rows() <= UINT16_MAX && i.cols() <= UINT16_MAX);

                bufSiz += mSiz;

            }

            return bufSiz;

        }


    private:

        real_T *_buf;

        rowsize _buf_size;

        static_assert(sizeof(real_T) == 8 || sizeof(real_T) == 4);

        static const ptrdiff_t n_real_in_64 = 8 / sizeof(real);


        DNDS_DEVICE_CALLABLE real_T *get_kth_64_meta_block(rowsize k) { return _buf + (k + 1) * n_real_in_64; }

        DNDS_DEVICE_CALLABLE [[nodiscard]] const real_T *get_kth_64_meta_block(rowsize k) const

        {

            return (const_cast<MatrixBatch *>(this))->get_kth_64_meta_block(k);

        }


    public:


        DNDS_DEVICE_CALLABLE MatrixBatch(real_T *n_buf, rowsize new_size) : _buf(n_buf), _buf_size(new_size)

        {

        }


        DNDS_DEVICE_CALLABLE [[nodiscard]] uint64_t &Size() const

        {

            DNDS_assert(_buf_size > 0);

            return *(uint64_t *)(_buf);

        }


        DNDS_DEVICE_CALLABLE [[nodiscard]] uint16_t getNRow(rowsize k) const

        {

            DNDS_assert(k < _buf_size - 1);

            return ((UInt16QuadIn64 *)get_kth_64_meta_block(k))->getA();

        }


        DNDS_DEVICE_CALLABLE [[nodiscard]] uint16_t getNCol(rowsize k) const

        {

            DNDS_assert(k < _buf_size - 1);

            return ((UInt16QuadIn64 *)get_kth_64_meta_block(k))->getB();

        }


        DNDS_DEVICE_CALLABLE [[nodiscard]] uint32_t getOffset(rowsize k) const

        {

            DNDS_assert(k < _buf_size - 1);

            return ((UInt32PairIn64 *)get_kth_64_meta_block(k))->getN();

        }


        DNDS_DEVICE_CALLABLE void setNRow(rowsize k, uint16_t v)

        {

            DNDS_assert(k < _buf_size - 1);

            ((UInt16QuadIn64 *)get_kth_64_meta_block(k))->setA(v);

        }


        DNDS_DEVICE_CALLABLE void setNCol(rowsize k, uint16_t v)

        {

            DNDS_assert(k < _buf_size - 1);

            ((UInt16QuadIn64 *)get_kth_64_meta_block(k))->setB(v);

        }


        DNDS_DEVICE_CALLABLE void setOffset(rowsize k, uint32_t v)

        {

            DNDS_assert(k < _buf_size - 1);

            ((UInt32PairIn64 *)get_kth_64_meta_block(k))->setN(v);

        }


        template <class t_matrices_elem>


        void CompressIn(const std::vector<t_matrices_elem> &matrices)

        {

            DNDS_assert(getBufSize(matrices) <= _buf_size);

            this->Size() = uint64_t(matrices.size()); // assuming could fit

            // std::cout << "Size: " << this->Size() << std::endl;

            uint32_t curOffset = uint32_t(this->Size()) + 1;

            for (size_t i = 0; i < matrices.size(); i++)

            {

                DNDS_assert(matrices[i].rows() <= Eigen::Index(UINT16_MAX));

                DNDS_assert(matrices[i].cols() <= Eigen::Index(UINT16_MAX));

                this->setNRow(rowsize(i), uint16_t(matrices[i].rows()));

                this->setNCol(rowsize(i), uint16_t(matrices[i].cols()));

                this->setOffset(rowsize(i), curOffset);

                this->operator[](i) = matrices[i];

                // std::cout << "SET: " << this->operator[](i) << std::endl;

                static_assert(std::numeric_limits<Eigen::Index>::digits > std::numeric_limits<uint32_t>::digits);

                DNDS_assert(matrices[i].size() <= Eigen::Index(UINT32_MAX - curOffset)); // overflow check

                curOffset += matrices[i].size();

            }

        }


        DNDS_DEVICE_CALLABLE t_map


        operator[](rowsize k)

        {

            DNDS_assert(k < this->Size());

            auto n_row = getNRow(k);

            auto n_col = getNCol(k);

            auto offset = getOffset(k);

            return {_buf + offset, n_row, n_col};

        }


        DNDS_DEVICE_CALLABLE t_map_const


        operator[](rowsize k) const

        {

            DNDS_assert(k < this->Size());

            auto n_row = getNRow(k);

            auto n_col = getNCol(k);

            auto offset = getOffset(k);

            return {_buf + offset, n_row, n_col};

        }


    };


    /**
     * @brief Device view of a non-uniform array whose rows are packed matrix batches.
     *
     * @details Extends `ArrayDeviceView<B, real_T, NonUniformSize>`: each row is
     * wrapped in a @ref DNDS::MatrixBatch "MatrixBatch" built from the base
     * view's `operator[](i)` and `RowSize(i)`, which gives access to the
     * individual matrices stored in that row.
     *
     * @tparam B      Device backend of the underlying view.
     * @tparam real_T Scalar type of the underlying buffer.
     */
    template <DeviceBackend B, class real_T>
    class ArrayEigenMatrixBatchDeviceView : public ArrayDeviceView<B, real_T, NonUniformSize>
    {
    public:
        using t_base = ArrayDeviceView<B, real_T, NonUniformSize>;
        using t_base::t_base;

        using t_matrix = typename MatrixBatch<real_T>::t_matrix;
        using t_map = typename MatrixBatch<real_T>::t_map;
        using t_map_const = typename MatrixBatch<real_T>::t_map_const;

        using t_self = ArrayEigenMatrixBatchDeviceView<B, real_T>;

        DNDS_DEVICE_TRIVIAL_COPY_DEFINE(ArrayEigenMatrixBatchDeviceView, t_self)

        /// Build the matrix-batch view from a plain base view of the same array.
        DNDS_DEVICE_CALLABLE ArrayEigenMatrixBatchDeviceView(const t_base &base_view) : t_base(base_view) {}

        /// Matrix batch stored in row @p i.
        DNDS_DEVICE_CALLABLE MatrixBatch<real_T> operator[](index i)
        {
            return {this->t_base::operator[](i), this->RowSize(i)};
        }

        /// Read-only matrix batch stored in row @p i.
        DNDS_DEVICE_CALLABLE MatrixBatch<const real_T> operator[](index i) const
        {
            return {this->t_base::operator[](i), this->RowSize(i)};
        }

        /// Number of matrices recorded in row @p i.
        DNDS_DEVICE_CALLABLE index BatchSize(index i)
        {
            return this->operator[](i).Size();
        }

        /// Number of matrices recorded in row @p i (callable on a const view,
        /// like the const `operator[]` / `operator()` overloads).
        DNDS_DEVICE_CALLABLE index BatchSize(index i) const
        {
            return static_cast<index>(this->operator[](i).Size());
        }

        /// Map onto matrix @p j of row @p i.
        DNDS_DEVICE_CALLABLE t_map operator()(index i, rowsize j)
        {
            return this->operator[](i)[j];
        }

        /// Read-only map onto matrix @p j of row @p i.
        DNDS_DEVICE_CALLABLE t_map_const operator()(index i, rowsize j) const
        {
            return this->operator[](i)[j];
        }
    };


}

Defines.hpp
Core type aliases, constants, and metaprogramming utilities for the DNDS framework.

DNDS_DEVICE_TRIVIAL_COPY_DEFINE
#define DNDS_DEVICE_TRIVIAL_COPY_DEFINE(T, T_Self)
Definition Defines.hpp:83

DNDS_DEVICE_CALLABLE
#define DNDS_DEVICE_CALLABLE
Definition Defines.hpp:76

DNDS_ROWSIZE_MAX
#define DNDS_ROWSIZE_MAX
Definition Defines.hpp:118

DeviceStorage.hpp
Device memory abstraction layer with backend-specific storage and factory creation.

DNDS_assert
#define DNDS_assert(expr)
Debug-only assertion (compiled out when DNDS_NDEBUG is defined). Prints the expression + file/line + ...
Definition Errors.hpp:108

DNDS::ArrayDeviceView
Non-owning device-callable view of an Array, specialised per DeviceBackend.
Definition DeviceView.hpp:40

DNDS::ArrayEigenMatrixBatchDeviceView
Definition ArrayEigenMatrixBatch_DeviceView.hpp:188

DNDS::ArrayEigenMatrixBatchDeviceView::operator[]
DNDS_DEVICE_CALLABLE MatrixBatch< real_T > operator[](index i)
Definition ArrayEigenMatrixBatch_DeviceView.hpp:203

DNDS::ArrayEigenMatrixBatchDeviceView::t_matrix
typename MatrixBatch< real_T >::t_matrix t_matrix
Definition ArrayEigenMatrixBatch_DeviceView.hpp:193

DNDS::ArrayEigenMatrixBatchDeviceView::operator[]
DNDS_DEVICE_CALLABLE MatrixBatch< const real_T > operator[](index i) const
Definition ArrayEigenMatrixBatch_DeviceView.hpp:208

DNDS::ArrayEigenMatrixBatchDeviceView::t_map_const
typename MatrixBatch< real_T >::t_map_const t_map_const
Definition ArrayEigenMatrixBatch_DeviceView.hpp:195

DNDS::ArrayEigenMatrixBatchDeviceView::operator()
DNDS_DEVICE_CALLABLE t_map_const operator()(index i, rowsize j) const
Definition ArrayEigenMatrixBatch_DeviceView.hpp:223

DNDS::ArrayEigenMatrixBatchDeviceView::t_map
typename MatrixBatch< real_T >::t_map t_map
Definition ArrayEigenMatrixBatch_DeviceView.hpp:194

DNDS::ArrayEigenMatrixBatchDeviceView::BatchSize
DNDS_DEVICE_CALLABLE index BatchSize(index i)
Definition ArrayEigenMatrixBatch_DeviceView.hpp:213

DNDS::ArrayEigenMatrixBatchDeviceView::operator()
DNDS_DEVICE_CALLABLE t_map operator()(index i, rowsize j)
Definition ArrayEigenMatrixBatch_DeviceView.hpp:218

DNDS::ArrayView::operator[]
T * operator[](index iRow)
Raw row pointer. iRow == Size() is allowed for past-the-end queries (useful for computing buffer end ...
Definition ArrayBasic.hpp:520

DNDS::ArrayView::RowSize
DNDS_DEVICE_CALLABLE rowsize RowSize() const
Uniform row width for fixed layouts (asserts otherwise).
Definition ArrayBasic.hpp:328

DNDS::MatrixBatch
Packed variable-shape matrix-batch layout inside a flat buffer.
Definition ArrayEigenMatrixBatch_DeviceView.hpp:36

DNDS::MatrixBatch::CompressIn
void CompressIn(const std::vector< t_matrices_elem > &matrices)
Definition ArrayEigenMatrixBatch_DeviceView.hpp:145

DNDS::MatrixBatch::getOffset
DNDS_DEVICE_CALLABLE uint32_t getOffset(rowsize k) const
Definition ArrayEigenMatrixBatch_DeviceView.hpp:120

DNDS::MatrixBatch::getNCol
DNDS_DEVICE_CALLABLE uint16_t getNCol(rowsize k) const
Definition ArrayEigenMatrixBatch_DeviceView.hpp:114

DNDS::MatrixBatch::t_matrix
Eigen::Matrix< std::remove_cv_t< real_T >, Eigen::Dynamic, Eigen::Dynamic > t_matrix
Definition ArrayEigenMatrixBatch_DeviceView.hpp:63

DNDS::MatrixBatch::getBufSize
static rowsize getBufSize(const std::vector< t_matrices_elem > &matrices)
Definition ArrayEigenMatrixBatch_DeviceView.hpp:71

DNDS::MatrixBatch::Size
DNDS_DEVICE_CALLABLE uint64_t & Size() const
Definition ArrayEigenMatrixBatch_DeviceView.hpp:102

DNDS::MatrixBatch::t_map_const
Eigen::Map< const t_matrix, Eigen::Unaligned > t_map_const
Definition ArrayEigenMatrixBatch_DeviceView.hpp:64

DNDS::MatrixBatch::setOffset
DNDS_DEVICE_CALLABLE void setOffset(rowsize k, uint32_t v)
Definition ArrayEigenMatrixBatch_DeviceView.hpp:138

DNDS::MatrixBatch::MatrixBatch
DNDS_DEVICE_CALLABLE MatrixBatch(real_T *n_buf, rowsize new_size)
Definition ArrayEigenMatrixBatch_DeviceView.hpp:98

DNDS::MatrixBatch::getNRow
DNDS_DEVICE_CALLABLE uint16_t getNRow(rowsize k) const
Definition ArrayEigenMatrixBatch_DeviceView.hpp:108

DNDS::MatrixBatch::operator[]
DNDS_DEVICE_CALLABLE t_map_const operator[](rowsize k) const
Definition ArrayEigenMatrixBatch_DeviceView.hpp:176

DNDS::MatrixBatch::t_map
std::conditional_t< std::is_const_v< real_T >, t_map_const, Eigen::Map< t_matrix, Eigen::Unaligned > > t_map
Definition ArrayEigenMatrixBatch_DeviceView.hpp:68

DNDS::MatrixBatch::setNCol
DNDS_DEVICE_CALLABLE void setNCol(rowsize k, uint16_t v)
Definition ArrayEigenMatrixBatch_DeviceView.hpp:132

DNDS::MatrixBatch::setNRow
DNDS_DEVICE_CALLABLE void setNRow(rowsize k, uint16_t v)
Definition ArrayEigenMatrixBatch_DeviceView.hpp:126

DNDS::MatrixBatch::operator[]
DNDS_DEVICE_CALLABLE t_map operator[](rowsize k)
Definition ArrayEigenMatrixBatch_DeviceView.hpp:166

DNDS
the host side operators are provided as implemented
Definition BenchmarkFiniteVolume.cpp:7

DNDS::rowsize
int32_t rowsize
Row-width / per-row element-count type (signed 32-bit).
Definition Defines.hpp:109

DNDS::index
int64_t index
Global row / DOF index type (signed 64-bit; handles multi-billion-cell meshes).
Definition Defines.hpp:107

DNDS::real
double real
Canonical floating-point scalar used throughout DNDSR (double precision).
Definition Defines.hpp:105

DNDS::MatrixBatch::UInt16QuadIn64
Definition ArrayEigenMatrixBatch_DeviceView.hpp:49

DNDS::MatrixBatch::UInt16QuadIn64::setA
DNDS_DEVICE_CALLABLE void setA(uint16_t v)
Definition ArrayEigenMatrixBatch_DeviceView.hpp:56

DNDS::MatrixBatch::UInt16QuadIn64::setD
DNDS_DEVICE_CALLABLE void setD(uint16_t v)
Definition ArrayEigenMatrixBatch_DeviceView.hpp:59

DNDS::MatrixBatch::UInt16QuadIn64::data
uint64_t data
Definition ArrayEigenMatrixBatch_DeviceView.hpp:50

DNDS::MatrixBatch::UInt16QuadIn64::setC
DNDS_DEVICE_CALLABLE void setC(uint16_t v)
Definition ArrayEigenMatrixBatch_DeviceView.hpp:58

DNDS::MatrixBatch::UInt16QuadIn64::getC
DNDS_DEVICE_CALLABLE uint16_t getC() const
Definition ArrayEigenMatrixBatch_DeviceView.hpp:53

DNDS::MatrixBatch::UInt16QuadIn64::getB
DNDS_DEVICE_CALLABLE uint16_t getB() const
Definition ArrayEigenMatrixBatch_DeviceView.hpp:52

DNDS::MatrixBatch::UInt16QuadIn64::getA
DNDS_DEVICE_CALLABLE uint16_t getA() const
Definition ArrayEigenMatrixBatch_DeviceView.hpp:51

DNDS::MatrixBatch::UInt16QuadIn64::setB
DNDS_DEVICE_CALLABLE void setB(uint16_t v)
Definition ArrayEigenMatrixBatch_DeviceView.hpp:57

DNDS::MatrixBatch::UInt16QuadIn64::getD
DNDS_DEVICE_CALLABLE uint16_t getD() const
Definition ArrayEigenMatrixBatch_DeviceView.hpp:54

DNDS::MatrixBatch::UInt32PairIn64
Definition ArrayEigenMatrixBatch_DeviceView.hpp:39

DNDS::MatrixBatch::UInt32PairIn64::data
uint64_t data
Definition ArrayEigenMatrixBatch_DeviceView.hpp:40

DNDS::MatrixBatch::UInt32PairIn64::getM
DNDS_DEVICE_CALLABLE uint32_t getM() const
Definition ArrayEigenMatrixBatch_DeviceView.hpp:41

DNDS::MatrixBatch::UInt32PairIn64::setN
DNDS_DEVICE_CALLABLE void setN(uint32_t v)
Definition ArrayEigenMatrixBatch_DeviceView.hpp:44

DNDS::MatrixBatch::UInt32PairIn64::getN
DNDS_DEVICE_CALLABLE uint32_t getN() const
Definition ArrayEigenMatrixBatch_DeviceView.hpp:42

DNDS::MatrixBatch::UInt32PairIn64::setM
DNDS_DEVICE_CALLABLE void setM(uint32_t v)
Definition ArrayEigenMatrixBatch_DeviceView.hpp:43

v
Eigen::Matrix< real, 5, 1 > v
Definition test_ArrayDOF.cpp:468