DNDSR/doxygen/EulerP__Evaluator__impl_8cpp_source.html

/** @file EulerP_Evaluator_impl.cpp

 *  @brief Host-backend explicit specializations of Evaluator_impl kernel methods.

 *

 *  Provides the DeviceBackend::Host specialization for each Evaluator_impl static method.

 *  Each method contains an OpenMP-parallelized loop that calls the corresponding

 *  device-callable kernel function from EulerP_Evaluator_impl_common.hxx.

 *

 *  For the CUDA backend specializations, see the separate CUDA compilation unit.

 */

#include "DNDS/Defines.hpp"

#include "DNDS/Device/DeviceStorage.hpp"

#include "EulerP/EulerP.hpp"

#include "EulerP_Evaluator_impl.hpp"

#include "EulerP_Evaluator_impl_common.hxx"


namespace DNDS::EulerP

{

    // Backend tag used by every explicit specialization in this translation unit:
    // all Evaluator_impl<B> methods defined below are the DeviceBackend::Host versions.
    static constexpr DeviceBackend B = DeviceBackend::Host;


    /**
     * @brief Host specialization: Green-Gauss gradient reconstruction.
     *
     * Runs two passes over the mesh reached through @c self_view.fv.mesh:
     *  -# a serial loop over boundary indices [0, mesh.NumBnd()) that calls
     *     RecGradient_GGRec_Kernel_BndVal, followed by
     *  -# a loop over cell indices [0, mesh.NumCell()) that calls
     *     RecGradient_GGRec_Kernel_GG; this loop is OpenMP-parallel when
     *     DNDS_DIST_MT_USE_OMP is defined.
     *
     * @param arg  Argument pack. @c arg.portable is forwarded to both kernels; the
     *             number of scalar variables is taken from @c uScalar.size().
     *
     * @throws std::runtime_error (raised by DNDS_check_throw) if the face BC buffer has
     *         no storage or holds fewer than mesh.NumFace() entries.
     */
    template <>
    void Evaluator_impl<B>::RecGradient_GGRec(RecGradient_Arg &arg)
    {
        using namespace Geom;

        DNDS_EULERP_IMPL_ARG_GET_REF(self_view)

        DNDS_EULERP_IMPL_ARG_GET_REF_PORTABLE(u)
        DNDS_EULERP_IMPL_ARG_GET_REF_PORTABLE(uGrad)
        DNDS_EULERP_IMPL_ARG_GET_REF_PORTABLE(uScalar)
        DNDS_EULERP_IMPL_ARG_GET_REF_PORTABLE(uScalarGrad)
        DNDS_EULERP_IMPL_ARG_GET_REF_PORTABLE(faceBCBuffer)
        DNDS_EULERP_IMPL_ARG_GET_REF_PORTABLE(faceBCScalarBuffer)

        // The kernels take the variable counts as int, so make the conversion explicit.
        const int nVarsScalar = static_cast<int>(uScalar.size());
        const int nVars = nVarsFlow + nVarsScalar;

        auto &mesh = self_view.fv.mesh;

        // Validate the flow BC buffer before any kernel touches it.
        // NOTE(review): faceBCScalarBuffer is not validated here -- confirm whether it
        // needs the same checks when nVarsScalar > 0.
        DNDS_check_throw(faceBCBuffer.father.data());
        DNDS_check_throw(faceBCBuffer.father.Size() >= mesh.NumFace());

        /*********************** */
        // bc handling (kept serial, as in the original implementation)
        const index nBnd = mesh.NumBnd();
        for (index iBnd = 0; iBnd < nBnd; ++iBnd)
        {
            RecGradient_GGRec_Kernel_BndVal(self_view, arg.portable, iBnd, nBnd, nVars, nVarsScalar);
        }

        /*********************** */
        // rec
        const index nCell = mesh.NumCell();
#if defined(DNDS_DIST_MT_USE_OMP)
#    pragma omp parallel for schedule(runtime)
#endif
        for (index iCell = 0; iCell < nCell; ++iCell)
        {
            RecGradient_GGRec_Kernel_GG(self_view, arg.portable, iCell, nCell, nVars, nVarsScalar);
        }
    }


    /**
     * @brief Host specialization: Barth-Jespersen gradient limiter.
     *
     * Loops over cell indices [0, mesh.NumCell()) and calls
     * RecGradient_BarthLimiter_Kernel_FlowPart for each. If @c uScalar.size() is
     * non-zero, a second loop over the same range calls
     * RecGradient_BarthLimiter_Kernel_ScalarPart. Both loops are OpenMP-parallel when
     * DNDS_DIST_MT_USE_OMP is defined.
     *
     * @param arg  Argument pack; @c arg.portable is forwarded to the kernels.
     */
    template <>
    void Evaluator_impl<B>::RecGradient_BarthLimiter(RecGradient_Arg &arg)
    {
        using namespace Geom;

        DNDS_EULERP_IMPL_ARG_GET_REF(self_view)
        DNDS_EULERP_IMPL_ARG_GET_REF_PORTABLE(u)
        DNDS_EULERP_IMPL_ARG_GET_REF_PORTABLE(uGrad)
        DNDS_EULERP_IMPL_ARG_GET_REF_PORTABLE(uScalar)
        DNDS_EULERP_IMPL_ARG_GET_REF_PORTABLE(uScalarGrad)

        // The kernels take the variable counts as int, so make the conversion explicit.
        const int nVarsScalar = static_cast<int>(uScalar.size());
        const int nVars = nVarsFlow + nVarsScalar;

        auto &mesh = self_view.fv.mesh;
        const index nCell = mesh.NumCell();

        /*********************** */
        // limit: flow variables
#if defined(DNDS_DIST_MT_USE_OMP)
#    pragma omp parallel for schedule(runtime)
#endif
        for (index iCell = 0; iCell < nCell; ++iCell)
        {
            RecGradient_BarthLimiter_Kernel_FlowPart(self_view, arg.portable, iCell, nCell, nVars, nVarsScalar);
        }

        // limit: scalars, only when there are any.
        // Braces keep the conditional body unambiguous whether or not the
        // preprocessor-guarded pragma is present.
        if (nVarsScalar != 0)
        {
#if defined(DNDS_DIST_MT_USE_OMP)
#    pragma omp parallel for schedule(runtime)
#endif
            for (index iCell = 0; iCell < nCell; ++iCell)
            {
                RecGradient_BarthLimiter_Kernel_ScalarPart(self_view, arg.portable, iCell, nCell, nVars, nVarsScalar);
            }
        }
    }


    /**
     * @brief Host specialization: conservative-to-primitive conversion with viscosity.
     *
     * Loops over indices [0, u.Size()) and calls Cons2PrimMu_Kernel for each one.
     * The loop is OpenMP-parallel when DNDS_DIST_MT_USE_OMP is defined.
     *
     * @param arg  Argument pack; @c arg.portable is forwarded to the kernel and the
     *             number of scalar variables is taken from @c uScalar.size().
     */
    template <>
    void Evaluator_impl<B>::Cons2PrimMu(Cons2PrimMu_Arg &arg)
    {
        using namespace Geom;

        DNDS_EULERP_IMPL_ARG_GET_REF(self_view)
        DNDS_EULERP_IMPL_ARG_GET_REF_PORTABLE(u)
        DNDS_EULERP_IMPL_ARG_GET_REF_PORTABLE(uScalar)

        // The kernel takes the variable counts as int, so make the conversion explicit.
        const int nVarsScalar = static_cast<int>(uScalar.size());
        const int nVars = nVarsFlow + nVarsScalar;

        // Iteration range comes from the u array itself, not from the mesh.
        const index nPt = u.Size();

#if defined(DNDS_DIST_MT_USE_OMP)
#    pragma omp parallel for schedule(runtime)
#endif
        for (index iPt = 0; iPt < nPt; ++iPt)
        {
            Cons2PrimMu_Kernel(self_view, arg.portable, iPt, nPt, nVars, nVarsScalar);
        }
    }


    /**
     * @brief Host specialization: conservative-to-primitive conversion (no gradients/viscosity).
     *
     * Loops over indices [0, u.Size()) and calls Cons2Prim_Kernel for each one.
     * The loop is OpenMP-parallel when DNDS_DIST_MT_USE_OMP is defined.
     *
     * @param arg  Argument pack; @c arg.portable is forwarded to the kernel and the
     *             number of scalar variables is taken from @c uScalar.size().
     */
    template <>
    void Evaluator_impl<B>::Cons2Prim(Cons2Prim_Arg &arg)
    {
        using namespace Geom;

        DNDS_EULERP_IMPL_ARG_GET_REF(self_view)
        DNDS_EULERP_IMPL_ARG_GET_REF_PORTABLE(u)
        DNDS_EULERP_IMPL_ARG_GET_REF_PORTABLE(uScalar)

        // The kernel takes the variable counts as int, so make the conversion explicit.
        const int nVarsScalar = static_cast<int>(uScalar.size());
        const int nVars = nVarsFlow + nVarsScalar;

        // Iteration range comes from the u array itself, not from the mesh.
        const index nPt = u.Size();

#if defined(DNDS_DIST_MT_USE_OMP)
#    pragma omp parallel for schedule(runtime)
#endif
        for (index iPt = 0; iPt < nPt; ++iPt)
        {
            Cons2Prim_Kernel(self_view, arg.portable, iPt, nPt, nVars, nVarsScalar);
        }
    }


    /**
     * @brief Host specialization: per-face eigenvalue estimation.
     *
     * Loops over face indices [0, mesh.NumFaceProc()) and calls
     * EstEigenDt_GetFaceLam_Kernel for each one. The loop is OpenMP-parallel when
     * DNDS_DIST_MT_USE_OMP is defined.
     *
     * No scalar array is part of this argument pack, so the kernel is invoked with
     * nVarsScalar == 0 and nVars == nVarsFlow.
     *
     * @param arg  Argument pack; @c arg.portable is forwarded to the kernel.
     */
    template <>
    void Evaluator_impl<B>::EstEigenDt_GetFaceLam(EstEigenDt_Arg &arg)
    {
        using namespace Geom;

        DNDS_EULERP_IMPL_ARG_GET_REF(self)
        DNDS_EULERP_IMPL_ARG_GET_REF(self_view)

        DNDS_EULERP_IMPL_ARG_GET_REF_PORTABLE(u)
        DNDS_EULERP_IMPL_ARG_GET_REF_PORTABLE(muCell)
        DNDS_EULERP_IMPL_ARG_GET_REF_PORTABLE(aCell)
        DNDS_EULERP_IMPL_ARG_GET_REF_PORTABLE(faceLamEst)
        DNDS_EULERP_IMPL_ARG_GET_REF_PORTABLE(faceLamVisEst)
        DNDS_EULERP_IMPL_ARG_GET_REF_PORTABLE(deltaLamFace)

        auto &mesh = self_view.fv.mesh;

        const int nVarsScalar = 0; // no uScalar here
        const int nVars = nVarsFlow + nVarsScalar;

        const index nFace = mesh.NumFaceProc();

#if defined(DNDS_DIST_MT_USE_OMP)
#    pragma omp parallel for schedule(runtime)
#endif
        for (index iFace = 0; iFace < nFace; ++iFace)
        {
            EstEigenDt_GetFaceLam_Kernel(self_view, arg.portable, iFace, nFace, nVars, nVarsScalar);
        }
    }


    /**
     * @brief Host specialization: face eigenvalue accumulation to cell time steps.
     *
     * Loops over cell indices [0, mesh.NumCell()) and calls
     * EstEigenDt_FaceLam2CellDt_Kernel for each one. The loop is OpenMP-parallel when
     * DNDS_DIST_MT_USE_OMP is defined.
     *
     * No scalar array is part of this argument pack, so the kernel is invoked with
     * nVarsScalar == 0 and nVars == nVarsFlow.
     *
     * @param arg  Argument pack; @c arg.portable is forwarded to the kernel.
     */
    template <>
    void Evaluator_impl<B>::EstEigenDt_FaceLam2CellDt(EstEigenDt_Arg &arg)
    {
        DNDS_EULERP_IMPL_ARG_GET_REF(self)
        DNDS_EULERP_IMPL_ARG_GET_REF(self_view)

        auto &mesh = self_view.fv.mesh;

        const int nVarsScalar = 0; // no uScalar here
        const int nVars = nVarsFlow + nVarsScalar;

        const index nCell = mesh.NumCell();

#if defined(DNDS_DIST_MT_USE_OMP)
#    pragma omp parallel for schedule(runtime)
#endif
        for (index iCell = 0; iCell < nCell; ++iCell)
        {
            EstEigenDt_FaceLam2CellDt_Kernel(self_view, arg.portable, iCell, nCell, nVars, nVarsScalar);
        }
    }


    /**
     * @brief Host specialization: 2nd-order face value reconstruction.
     *
     * Loops over face indices [0, mesh.NumFaceProc()) and calls RecFace2nd_Kernel
     * for each one. The loop is OpenMP-parallel when DNDS_DIST_MT_USE_OMP is defined.
     *
     * @param arg  Argument pack; @c arg.portable is forwarded to the kernel and the
     *             number of scalar variables is taken from @c uScalar.size().
     */
    template <>
    void Evaluator_impl<B>::RecFace2nd(RecFace2nd_Arg &arg)
    {
        using namespace Geom;

        DNDS_EULERP_IMPL_ARG_GET_REF(self)
        DNDS_EULERP_IMPL_ARG_GET_REF(self_view)

        DNDS_EULERP_IMPL_ARG_GET_REF_PORTABLE(uScalar)

        auto &mesh = self_view.fv.mesh;

        // The kernel takes the variable counts as int, so make the conversion explicit.
        const int nVarsScalar = static_cast<int>(uScalar.size());
        const int nVars = nVarsScalar + nVarsFlow;

        const index nFace = mesh.NumFaceProc();

#if defined(DNDS_DIST_MT_USE_OMP)
#    pragma omp parallel for schedule(runtime)
#endif
        for (index iFace = 0; iFace < nFace; ++iFace)
        {
            RecFace2nd_Kernel(self_view, arg.portable, iFace, nFace, nVars, nVarsScalar);
        }
    }


    /**
     * @brief Host specialization: 2nd-order flux evaluation and face-to-cell RHS scatter.
     *
     * Runs two consecutive loops, each OpenMP-parallel when DNDS_DIST_MT_USE_OMP is
     * defined:
     *  -# over face indices [0, mesh.NumFaceProc()), calling Flux2nd_Kernel_FluxFace;
     *  -# over cell indices [0, mesh.NumCell()), calling Flux2nd_Kernel_Face2Cell.
     *
     * The face loop is a separate loop construct and completes before the cell loop
     * starts.
     *
     * @param arg  Argument pack; @c arg.portable is forwarded to both kernels and the
     *             number of scalar variables is taken from @c uScalarFL.size().
     */
    template <>
    void Evaluator_impl<B>::Flux2nd(Flux2nd_Arg &arg)
    {
        using namespace Geom;

        DNDS_EULERP_IMPL_ARG_GET_REF(self)
        DNDS_EULERP_IMPL_ARG_GET_REF(self_view)

        DNDS_EULERP_IMPL_ARG_GET_REF_PORTABLE(uScalarFL)

        auto &mesh = self_view.fv.mesh;

        // The kernels take the variable counts as int, so make the conversion explicit.
        const int nVarsScalar = static_cast<int>(uScalarFL.size());
        const int nVars = nVarsScalar + nVarsFlow;

        // Pass 1: per-face flux.
        const index nFace = mesh.NumFaceProc();
#if defined(DNDS_DIST_MT_USE_OMP)
#    pragma omp parallel for schedule(runtime)
#endif
        for (index iFace = 0; iFace < nFace; ++iFace)
        {
            Flux2nd_Kernel_FluxFace(self_view, arg.portable, iFace, nFace, nVars, nVarsScalar);
        }

        // Pass 2: gather face contributions per cell.
        const index nCell = mesh.NumCell();
#if defined(DNDS_DIST_MT_USE_OMP)
#    pragma omp parallel for schedule(runtime)
#endif
        for (index iCell = 0; iCell < nCell; ++iCell)
        {
            Flux2nd_Kernel_Face2Cell(self_view, arg.portable, iCell, nCell, nVars, nVarsScalar);
        }
    }


}

Defines.hpp
Core type aliases, constants, and metaprogramming utilities for the DNDS framework.

DeviceStorage.hpp
Device memory abstraction layer with backend-specific storage and factory creation.

DNDS_check_throw
#define DNDS_check_throw(expr)
Runtime check active in both debug and release builds. Throws std::runtime_error if expr evaluates to false.
Definition Errors.hpp:93

EulerP.hpp
Core type definitions and utilities for the EulerP alternative Navier-Stokes evaluator module.

EulerP_Evaluator_impl.hpp
Backend-specific implementation layer for EulerP Evaluator kernel dispatch.

DNDS_EULERP_IMPL_ARG_GET_REF_PORTABLE
#define DNDS_EULERP_IMPL_ARG_GET_REF_PORTABLE(member)
Definition EulerP_Evaluator_impl.hpp:25

DNDS_EULERP_IMPL_ARG_GET_REF
#define DNDS_EULERP_IMPL_ARG_GET_REF(member)
Definition EulerP_Evaluator_impl.hpp:24

EulerP_Evaluator_impl_common.hxx
Shared device-callable kernel implementations for the EulerP Evaluator.

DNDS::EulerP
Namespace for the EulerP alternative evaluator module with GPU support.
Definition EulerP.hpp:29

DNDS::EulerP::EstEigenDt_FaceLam2CellDt_Kernel
DNDS_DEVICE void EstEigenDt_FaceLam2CellDt_Kernel(EvaluatorDeviceView< B > &self_view, typename Evaluator_impl< B >::EstEigenDt_Arg::Portable &arg, index iCell, index iCellEnd, int nVars, int nVarsScalar)
Per-cell kernel converting face eigenvalues to a local CFL time step.
Definition EulerP_Evaluator_impl_common.hxx:821

DNDS::EulerP::Flux2nd_Kernel_FluxFace
DNDS_DEVICE void Flux2nd_Kernel_FluxFace(EvaluatorDeviceView< B > &self_view, typename Evaluator_impl< B >::Flux2nd_Arg::Portable &arg, index iFace, index iFaceEnd, int nVars, int nVarsScalar)
2nd-order Roe inviscid flux computation kernel (per-face).
Definition EulerP_Evaluator_impl_common.hxx:1035

DNDS::EulerP::RecGradient_BarthLimiter_Kernel_FlowPart
DNDS_DEVICE void RecGradient_BarthLimiter_Kernel_FlowPart(EvaluatorDeviceView< B > &self_view, typename Evaluator_impl< B >::RecGradient_Arg::Portable &arg, index iCell, index iCellEnd, int nVars, int nVarsScalar)
Barth-Jespersen gradient limiter kernel for flow variables (per-cell).
Definition EulerP_Evaluator_impl_common.hxx:252

DNDS::EulerP::RecFace2nd_Kernel
DNDS_DEVICE void RecFace2nd_Kernel(EvaluatorDeviceView< B > &self_view, typename Evaluator_impl< B >::RecFace2nd_Arg::Portable &arg, index iFace, index iFaceEnd, int nVars, int nVarsScalar)
2nd-order face value reconstruction kernel (per-face).
Definition EulerP_Evaluator_impl_common.hxx:886

DNDS::EulerP::RecGradient_GGRec_Kernel_GG
DNDS_DEVICE void RecGradient_GGRec_Kernel_GG(EvaluatorDeviceView< B > &self_view, typename Evaluator_impl< B >::RecGradient_Arg::Portable &arg, index iCell, index iCellEnd, int nVars, int nVarsScalar)
Green-Gauss gradient reconstruction kernel (per-cell).
Definition EulerP_Evaluator_impl_common.hxx:127

DNDS::EulerP::Cons2Prim_Kernel
DNDS_DEVICE void Cons2Prim_Kernel(EvaluatorDeviceView< B > &self_view, typename Evaluator_impl< B >::Cons2Prim_Arg::Portable &arg, index iPt, index iPtEnd, int nVars, int nVarsScalar)
Conservative-to-primitive conversion without gradient transformation or viscosity (per-cell).
Definition EulerP_Evaluator_impl_common.hxx:633

DNDS::EulerP::RecGradient_BarthLimiter_Kernel_ScalarPart
DNDS_DEVICE void RecGradient_BarthLimiter_Kernel_ScalarPart(EvaluatorDeviceView< B > &self_view, typename Evaluator_impl< B >::RecGradient_Arg::Portable &arg, index iCell, index iCellEnd, int nVars, int nVarsScalar)
Barth-Jespersen gradient limiter kernel for transported scalar variables (per-cell).
Definition EulerP_Evaluator_impl_common.hxx:400

DNDS::EulerP::Flux2nd_Kernel_Face2Cell
DNDS_DEVICE void Flux2nd_Kernel_Face2Cell(EvaluatorDeviceView< B > &self_view, typename Evaluator_impl< B >::Flux2nd_Arg::Portable &arg, index iCell, index iCellEnd, int nVars, int nVarsScalar)
Scatters face fluxes to cell RHS residual (per-cell).
Definition EulerP_Evaluator_impl_common.hxx:1215

DNDS::EulerP::RecGradient_GGRec_Kernel_BndVal
DNDS_DEVICE void RecGradient_GGRec_Kernel_BndVal(EvaluatorDeviceView< B > &self_view, typename Evaluator_impl< B >::RecGradient_Arg::Portable &arg, index iBnd, index iBndEnd, int nVars, int nVarsScalar)
Generates boundary ghost values for Green-Gauss gradient reconstruction.
Definition EulerP_Evaluator_impl_common.hxx:52

DNDS::EulerP::EstEigenDt_GetFaceLam_Kernel
DNDS_DEVICE void EstEigenDt_GetFaceLam_Kernel(EvaluatorDeviceView< B > &self_view, typename Evaluator_impl< B >::EstEigenDt_Arg::Portable &arg, index iFace, index iFaceEnd, int nVars, int nVarsScalar)
Per-face eigenvalue estimation kernel for time-step computation.
Definition EulerP_Evaluator_impl_common.hxx:732

DNDS::EulerP::Cons2PrimMu_Kernel
DNDS_DEVICE void Cons2PrimMu_Kernel(EvaluatorDeviceView< B > &self_view, typename Evaluator_impl< B >::Cons2PrimMu_Arg::Portable &arg, index iPt, index iPtEnd, int nVars, int nVarsScalar)
Conservative-to-primitive conversion with gradient transformation and viscosity (per-cell).
Definition EulerP_Evaluator_impl_common.hxx:493

DNDS::DeviceBackend
DeviceBackend
Enumerates the backends a DeviceStorage / Array can live on.
Definition DeviceStorage.hpp:28

DNDS::DeviceBackend::Host
@ Host
Plain CPU memory.

DNDS::index
int64_t index
Global row / DOF index type (signed 64-bit; handles multi-billion-cell meshes).
Definition Defines.hpp:112

DNDS::EulerP::Evaluator_impl::Cons2PrimMu_Arg
Device-side argument struct for conservative-to-primitive + viscosity kernel.
Definition EulerP_Evaluator_impl.hpp:151

DNDS::EulerP::Evaluator_impl::Cons2PrimMu_Arg::portable
struct DNDS::EulerP::Evaluator_impl::Cons2PrimMu_Arg::Portable portable

DNDS::EulerP::Evaluator_impl::Cons2Prim_Arg
Device-side argument struct for conservative-to-primitive conversion (no gradients/viscosity).
Definition EulerP_Evaluator_impl.hpp:214

DNDS::EulerP::Evaluator_impl::Cons2Prim_Arg::portable
struct DNDS::EulerP::Evaluator_impl::Cons2Prim_Arg::Portable portable

DNDS::EulerP::Evaluator_impl::EstEigenDt_Arg
Device-side argument struct for eigenvalue estimation and time-step computation.
Definition EulerP_Evaluator_impl.hpp:263

DNDS::EulerP::Evaluator_impl::EstEigenDt_Arg::portable
struct DNDS::EulerP::Evaluator_impl::EstEigenDt_Arg::Portable portable

DNDS::EulerP::Evaluator_impl::Flux2nd_Arg
Device-side argument struct for 2nd-order flux evaluation and RHS accumulation.
Definition EulerP_Evaluator_impl.hpp:371

DNDS::EulerP::Evaluator_impl::Flux2nd_Arg::portable
struct DNDS::EulerP::Evaluator_impl::Flux2nd_Arg::Portable portable

DNDS::EulerP::Evaluator_impl::RecFace2nd_Arg
Device-side argument struct for 2nd-order face value reconstruction.
Definition EulerP_Evaluator_impl.hpp:312

DNDS::EulerP::Evaluator_impl::RecFace2nd_Arg::portable
struct DNDS::EulerP::Evaluator_impl::RecFace2nd_Arg::Portable portable

DNDS::EulerP::Evaluator_impl::RecGradient_Arg
Device-side argument struct for gradient reconstruction kernels.
Definition EulerP_Evaluator_impl.hpp:91

DNDS::EulerP::Evaluator_impl::RecGradient_Arg::portable
struct DNDS::EulerP::Evaluator_impl::RecGradient_Arg::Portable portable

DNDS::EulerP::Evaluator_impl::Flux2nd
static void Flux2nd(Flux2nd_Arg &arg)
Evaluates 2nd-order Roe flux per face and scatters to cell RHS.

DNDS::EulerP::Evaluator_impl::Cons2PrimMu
static void Cons2PrimMu(Cons2PrimMu_Arg &arg)
Executes conservative-to-primitive conversion with viscosity computation.

DNDS::EulerP::Evaluator_impl::EstEigenDt_GetFaceLam
static void EstEigenDt_GetFaceLam(EstEigenDt_Arg &arg)
First pass: computes per-face eigenvalue estimates from cell states.

DNDS::EulerP::Evaluator_impl::Cons2Prim
static void Cons2Prim(Cons2Prim_Arg &arg)
Executes conservative-to-primitive conversion (no gradients/viscosity).

DNDS::EulerP::Evaluator_impl::EstEigenDt_FaceLam2CellDt
static void EstEigenDt_FaceLam2CellDt(EstEigenDt_Arg &arg)
Second pass: accumulates face eigenvalues to cells and computes local dt.

DNDS::EulerP::Evaluator_impl::RecFace2nd
static void RecFace2nd(RecFace2nd_Arg &arg)
Executes 2nd-order face value reconstruction from cell-centered data.

DNDS::EulerP::Evaluator_impl::RecGradient_BarthLimiter
static void RecGradient_BarthLimiter(RecGradient_Arg &arg)
Barth-Jespersen gradient limiter applied to reconstructed gradients.

DNDS::EulerP::Evaluator_impl::RecGradient_GGRec
static void RecGradient_GGRec(RecGradient_Arg &arg)
Green-Gauss gradient reconstruction: boundary ghost values + cell gradient computation.

mesh
DistributedHex3D mesh
Definition test_MeshConnectivity_Interpolate.cpp:929