4.6/det_8cpp_source.html

 // Copyright (c) 2010-2023, Lawrence Livermore National Security, LLC. Produced
 // at the Lawrence Livermore National Laboratory. All Rights reserved. See files
 // LICENSE and NOTICE for details. LLNL-CODE-806117.
 //
 // This file is part of the MFEM library. For more information and source code
 // availability visit https://mfem.org.
 //
 // MFEM is free software; you can redistribute it and/or modify it under the
 // terms of the BSD-3 license. We welcome feedback and contributions, see file
 // CONTRIBUTING.md for details.

 #include "../quadinterpolator.hpp"
 #include "../../general/forall.hpp"
 #include "../../linalg/dtensor.hpp"
 #include "../../fem/kernels.hpp"
 #include "../../linalg/kernels.hpp"

 using namespace mfem;

 namespace mfem
 {

 namespace internal
 {

 namespace quadrature_interpolator
 {

 /// 1D kernel: for every element e and quadrature point q, store
 /// sum_d G(q,d) * X(d,e) in Y(q,e).
 ///
 /// @param NE   number of elements (extent of the mfem::forall loop)
 /// @param g    gradient table, viewed as a (q1d x d1d) tensor
 /// @param x    element data, viewed as a (d1d x NE) tensor
 /// @param y    output, viewed as a (q1d x NE) tensor
 /// @param d1d  number of 1D degrees of freedom
 /// @param q1d  number of 1D quadrature points
 static void Det1D(const int NE,
                   const double *g,
                   const double *x,
                   double *y,
                   const int d1d,
                   const int q1d)
 {
    const auto grad  = Reshape(g, q1d, d1d);
    const auto nodes = Reshape(x, d1d, NE);
    auto det = Reshape(y, q1d, NE);

    mfem::forall(NE, [=] MFEM_HOST_DEVICE (int e)
    {
       for (int iq = 0; iq < q1d; ++iq)
       {
          // Contract the gradient row of this quadrature point with the
          // element's values, accumulating in increasing dof order.
          double dx_dxi = 0.0;
          for (int id = 0; id < d1d; ++id)
          {
             dx_dxi += grad(iq, id) * nodes(id, e);
          }
          det(iq, e) = dx_dxi;
       }
    });
 }

 /// 2D kernel: for every element e and quadrature point (qx,qy), run the
 /// LoadX/LoadBG/GradX/GradY stages, gather the resulting four gradient values
 /// with PullGrad and store kernels::Det<2> of them in Y(qx,qy,e).
 ///
 /// @tparam T_D1D  compile-time number of 1D dofs (0: use the runtime @a d1d)
 /// @tparam T_Q1D  compile-time number of 1D quadrature points (0: use @a q1d)
 /// @param NE    number of elements
 /// @param b     basis table, viewed as (Q1D x D1D)
 /// @param g     gradient table, viewed as (Q1D x D1D)
 /// @param x     element data, viewed as (D1D x D1D x 2 x NE)
 /// @param y     output, viewed as (Q1D x Q1D x NE)
 /// @param vdim  not referenced by this kernel
 /// @param d1d   runtime number of 1D dofs, used when T_D1D == 0
 /// @param q1d   runtime number of 1D quadrature points, used when T_Q1D == 0
 template<int T_D1D = 0, int T_Q1D = 0>
 static void Det2D(const int NE,
                   const double *b,
                   const double *g,
                   const double *x,
                   double *y,
                   const int vdim = 1,
                   const int d1d = 0,
                   const int q1d = 0)
 {
    constexpr int DIM = 2;
    static constexpr int NBZ = 1;

    // Host-side sizes: a non-zero template argument wins over the runtime one.
    const int nd = T_D1D ? T_D1D : d1d;
    const int nq = T_Q1D ? T_Q1D : q1d;

    const auto basis = Reshape(b, nq, nd);
    const auto grad  = Reshape(g, nq, nd);
    const auto nodes = Reshape(x, nd, nd, DIM, NE);
    auto det = Reshape(y, nq, nq, NE);

    mfem::forall_2D_batch(NE, nq, nq, NBZ, [=] MFEM_HOST_DEVICE (int e)
    {
       // Compile-time bounds used to size the scratch arrays.
       constexpr int MD1 = T_D1D ? T_D1D : DofQuadLimits::MAX_D1D;
       constexpr int MQ1 = T_Q1D ? T_Q1D : DofQuadLimits::MAX_Q1D;
       // Sizes are recomputed inside the body from the template arguments and
       // the captured runtime values.
       const int D1D = T_D1D ? T_D1D : d1d;
       const int Q1D = T_Q1D ? T_Q1D : q1d;

       MFEM_SHARED double s_BG[2][MQ1*MD1];
       MFEM_SHARED double s_X[2][NBZ][MD1*MD1];
       MFEM_SHARED double s_DQ[4][NBZ][MD1*MQ1];
       MFEM_SHARED double s_QQ[4][NBZ][MQ1*MQ1];

       kernels::internal::LoadX<MD1,NBZ>(e, D1D, nodes, s_X);
       kernels::internal::LoadBG<MD1,MQ1>(D1D, Q1D, basis, grad, s_BG);

       kernels::internal::GradX<MD1,MQ1,NBZ>(D1D, Q1D, s_BG, s_X, s_DQ);
       kernels::internal::GradY<MD1,MQ1,NBZ>(D1D, Q1D, s_BG, s_DQ, s_QQ);

       MFEM_FOREACH_THREAD(iy,y,Q1D)
       {
          MFEM_FOREACH_THREAD(ix,x,Q1D)
          {
             double jac[4];
             kernels::internal::PullGrad<MQ1,NBZ>(Q1D, ix, iy, s_QQ, jac);
             det(ix, iy, e) = kernels::Det<2>(jac);
          }
       }
    });
 }

 template<int T_D1D = 0, int T_Q1D = 0, bool SMEM = true>
 static void Det3D(const int NE,
                   const double *b,
                   const double *g,
                   const double *x,
                   double *y,
                   const int vdim = 1,
                   const int d1d = 0,
                   const int q1d = 0,
                   Vector *d_buff = nullptr) // used only with SMEM = false
 {
    constexpr int DIM = 3;
    static constexpr int GRID = SMEM ? 0 : 128;

    const int D1D = T_D1D ? T_D1D : d1d;
    const int Q1D = T_Q1D ? T_Q1D : q1d;

    const auto B = Reshape(b, Q1D, D1D);
    const auto G = Reshape(g, Q1D, D1D);
    const auto X = Reshape(x, D1D, D1D, D1D, DIM, NE);
    auto Y = Reshape(y, Q1D, Q1D, Q1D, NE);

    double *GM = nullptr;
    if (!SMEM)
    {
       const DeviceDofQuadLimits &limits = DeviceDofQuadLimits::Get();
       const int max_q1d = T_Q1D ? T_Q1D : limits.MAX_D1D;
       const int max_d1d = T_D1D ? T_D1D : limits.MAX_Q1D;
       const int max_qd = std::max(max_q1d, max_d1d);
       const int mem_size = max_qd * max_qd * max_qd * 9;
       d_buff->SetSize(2*mem_size*GRID);
       GM = d_buff->Write();
    }

    mfem::forall_3D_grid(NE, Q1D, Q1D, Q1D, GRID, [=] MFEM_HOST_DEVICE (int e)
    {
       static constexpr int MQ1 = T_Q1D ? T_Q1D :
                                  (SMEM ? DofQuadLimits::MAX_DET_1D : DofQuadLimits::MAX_D1D);
       static constexpr int MD1 = T_D1D ? T_D1D :
                                  (SMEM ? DofQuadLimits::MAX_DET_1D : DofQuadLimits::MAX_Q1D);
       static constexpr int MDQ = MQ1 > MD1 ? MQ1 : MD1;
       static constexpr int MSZ = MDQ * MDQ * MDQ * 9;

       const int bid = MFEM_BLOCK_ID(x);
       MFEM_SHARED double BG[2][MQ1*MD1];
       MFEM_SHARED double SM0[SMEM?MSZ:1];
       MFEM_SHARED double SM1[SMEM?MSZ:1];
       double *lm0 = SMEM ? SM0 : GM + MSZ*bid;
       double *lm1 = SMEM ? SM1 : GM + MSZ*(GRID+bid);
       double (*DDD)[MD1*MD1*MD1] = (double (*)[MD1*MD1*MD1]) (lm0);
       double (*DDQ)[MD1*MD1*MQ1] = (double (*)[MD1*MD1*MQ1]) (lm1);
       double (*DQQ)[MD1*MQ1*MQ1] = (double (*)[MD1*MQ1*MQ1]) (lm0);
       double (*QQQ)[MQ1*MQ1*MQ1] = (double (*)[MQ1*MQ1*MQ1]) (lm1);

       kernels::internal::LoadX<MD1>(e,D1D,X,DDD);
       kernels::internal::LoadBG<MD1,MQ1>(D1D,Q1D,B,G,BG);

       kernels::internal::GradX<MD1,MQ1>(D1D,Q1D,BG,DDD,DDQ);
       kernels::internal::GradY<MD1,MQ1>(D1D,Q1D,BG,DDQ,DQQ);
       kernels::internal::GradZ<MD1,MQ1>(D1D,Q1D,BG,DQQ,QQQ);

       MFEM_FOREACH_THREAD(qz,z,Q1D)
       {
          MFEM_FOREACH_THREAD(qy,y,Q1D)
          {
             MFEM_FOREACH_THREAD(qx,x,Q1D)
             {
                double J[9];
                kernels::internal::PullGrad<MQ1>(Q1D, qx,qy,qz, QQQ, J);
                Y(qx,qy,qz,e) = kernels::Det<3>(J);
             }
          }
       }
    });
 }

 // Tensor-product evaluation of quadrature point determinants: dispatch
 // function.
 //
 // Reads the reference dimension from maps.FE, the 1D sizes from maps.ndof and
 // maps.nqpt, and the B/G tables from maps, then forwards to Det1D, Det2D or
 // Det3D. Specialized template instantiations are selected for a fixed list of
 // (vdim, D1D, Q1D) combinations; every other combination uses the generic
 // runtime-sized kernel after checking the sizes against the device limits.
 //
 //   NE     - number of elements; the function returns immediately when 0
 //   vdim   - vector dimension, used only to select a specialization
 //   maps   - source of dim, D1D, Q1D, B and G
 //   e_vec  - input element vector (read)
 //   q_det  - output vector (written)
 //   d_buff - scratch vector handed to the 3D global-memory fallback
 void TensorDeterminants(const int NE,
                         const int vdim,
                         const DofToQuad &maps,
                         const Vector &e_vec,
                         Vector &q_det,
                         Vector &d_buff)
 {
    if (NE == 0) { return; }
    const int dim = maps.FE->GetDim();
    const int D1D = maps.ndof;
    const int Q1D = maps.nqpt;
    const double *B = maps.B.Read();
    const double *G = maps.G.Read();
    const double *X = e_vec.Read();
    double *Y = q_det.Write();

    const int id = (vdim<<8) | (D1D<<4) | Q1D;
    // The packed id gives D1D and Q1D one hex digit each. Sizes of 16 or more
    // spill into the neighbouring digit and could alias a specialized case
    // (e.g. D1D=2, Q1D=19 packs to 0x333), so such sizes are routed to the
    // generic kernels by using a key that matches no case label.
    const bool fits_in_nibbles = (D1D < 16) && (Q1D < 16);
    const int key = fits_in_nibbles ? id : -1;

    if (dim == 1)
    {
       MFEM_VERIFY(D1D <= DeviceDofQuadLimits::Get().MAX_D1D,
                   "Orders higher than " << DeviceDofQuadLimits::Get().MAX_D1D-1
                   << " are not supported!");
       MFEM_VERIFY(Q1D <= DeviceDofQuadLimits::Get().MAX_Q1D,
                   "Quadrature rules with more than "
                   << DeviceDofQuadLimits::Get().MAX_Q1D << " 1D points are not supported!");
       Det1D(NE, G, X, Y, D1D, Q1D);
       return;
    }
    if (dim == 2)
    {
       switch (key)
       {
          case 0x222: return Det2D<2,2>(NE,B,G,X,Y);
          case 0x223: return Det2D<2,3>(NE,B,G,X,Y);
          case 0x224: return Det2D<2,4>(NE,B,G,X,Y);
          case 0x226: return Det2D<2,6>(NE,B,G,X,Y);
          case 0x234: return Det2D<3,4>(NE,B,G,X,Y);
          case 0x236: return Det2D<3,6>(NE,B,G,X,Y);
          case 0x244: return Det2D<4,4>(NE,B,G,X,Y);
          case 0x246: return Det2D<4,6>(NE,B,G,X,Y);
          case 0x256: return Det2D<5,6>(NE,B,G,X,Y);
          default:
          {
             const int MD = DeviceDofQuadLimits::Get().MAX_D1D;
             const int MQ = DeviceDofQuadLimits::Get().MAX_Q1D;
             MFEM_VERIFY(D1D <= MD, "Orders higher than " << MD-1
                         << " are not supported!");
             MFEM_VERIFY(Q1D <= MQ, "Quadrature rules with more than "
                         << MQ << " 1D points are not supported!");
             Det2D(NE,B,G,X,Y,vdim,D1D,Q1D);
             return;
          }
       }
    }
    if (dim == 3)
    {
       switch (key)
       {
          case 0x324: return Det3D<2,4>(NE,B,G,X,Y);
          case 0x333: return Det3D<3,3>(NE,B,G,X,Y);
          case 0x335: return Det3D<3,5>(NE,B,G,X,Y);
          case 0x336: return Det3D<3,6>(NE,B,G,X,Y);
          default:
          {
             const int MD = DeviceDofQuadLimits::Get().MAX_DET_1D;
             const int MQ = DeviceDofQuadLimits::Get().MAX_DET_1D;
             // Highest orders that fit in shared memory
             if (D1D <= MD && Q1D <= MQ)
             { return Det3D<0,0,true>(NE,B,G,X,Y,vdim,D1D,Q1D); }
             // Last fall-back will use global memory. Its scratch buffer is
             // sized from MAX_D1D/MAX_Q1D, so larger sizes must be rejected
             // here, as in the 1D and 2D paths.
             const int MD1 = DeviceDofQuadLimits::Get().MAX_D1D;
             const int MQ1 = DeviceDofQuadLimits::Get().MAX_Q1D;
             MFEM_VERIFY(D1D <= MD1, "Orders higher than " << MD1-1
                         << " are not supported!");
             MFEM_VERIFY(Q1D <= MQ1, "Quadrature rules with more than "
                         << MQ1 << " 1D points are not supported!");
             return Det3D<0,0,false>(
                       NE,B,G,X,Y,vdim,D1D,Q1D,&d_buff);
          }
       }
    }
    MFEM_ABORT("Kernel " << std::hex << id << std::dec << " not supported yet");
 }

 } // namespace quadrature_interpolator

 } // namespace internal

 } // namespace mfem
mfem::Array::Read
const T * Read(bool on_dev=true) const
Shortcut for mfem::Read(a.GetMemory(), a.Size(), on_dev).
Definition: array.hpp:307

mfem::DofToQuad::FE
const class FiniteElement * FE
The FiniteElement that created and owns this object.
Definition: fe_base.hpp:141

mfem::DofToQuad::nqpt
int nqpt
Number of quadrature points. When mode is TENSOR, this is the 1D number.
Definition: fe_base.hpp:173

mfem::Vector::Read
virtual const double * Read(bool on_dev=true) const
Shortcut for mfem::Read(vec.GetMemory(), vec.Size(), on_dev).
Definition: vector.hpp:453

mfem::DofToQuad::ndof
int ndof
Number of degrees of freedom = number of basis functions. When mode is TENSOR, this is the 1D number.
Definition: fe_base.hpp:169

DIM
constexpr int DIM
Definition: minimal-surface.cpp:71

mfem::DeviceDofQuadLimits::MAX_Q1D
int MAX_Q1D
Maximum number of 1D quadrature points.
Definition: forall.hpp:113

mfem::DeviceDofQuadLimits::MAX_DET_1D
int MAX_DET_1D
Maximum number of points for determinant computation in QuadratureInterpolator.
Definition: forall.hpp:119

mfem::forall_3D_grid
void forall_3D_grid(int N, int X, int Y, int Z, int G, lambda &&body)
Definition: forall.hpp:769

mfem
Definition: CodeDocumentation.dox:1

mfem::Vector::Write
virtual double * Write(bool on_dev=true)
Shortcut for mfem::Write(vec.GetMemory(), vec.Size(), on_dev).
Definition: vector.hpp:461

b
double b
Definition: lissajous.cpp:42

mfem::forall_2D_batch
void forall_2D_batch(int N, int X, int Y, int BZ, lambda &&body)
Definition: forall.hpp:757

mfem::Det3D
MFEM_HOST_DEVICE double Det3D(DeviceMatrix &J)
Definition: lor_util.hpp:188

mfem::Det2D
MFEM_HOST_DEVICE double Det2D(DeviceMatrix &J)
Definition: lor_util.hpp:183

mfem::DeviceDofQuadLimits::MAX_D1D
int MAX_D1D
Maximum number of 1D nodal points.
Definition: forall.hpp:112

mfem::FiniteElement::GetDim
int GetDim() const
Returns the reference space dimension for the finite element.
Definition: fe_base.hpp:311

mfem::forall
void forall(int N, lambda &&body)
Definition: forall.hpp:742

mfem::DeviceDofQuadLimits
Maximum number of 1D DOFs or quadrature points for the current runtime configuration of the Device (u...
Definition: forall.hpp:110

mfem::DofToQuad
Structure representing the matrices/tensors needed to evaluate (in reference space) the values...
Definition: fe_base.hpp:136

mfem::DeviceDofQuadLimits::Get
static const DeviceDofQuadLimits & Get()
Return a const reference to the DeviceDofQuadLimits singleton.
Definition: forall.hpp:122

mfem::DofToQuad::B
Array< double > B
Basis functions evaluated at quadrature points.
Definition: fe_base.hpp:184

dim
int dim
Definition: ex24.cpp:53

mfem::DofToQuad::G
Array< double > G
Gradients/divergences/curls of basis functions evaluated at quadrature points.
Definition: fe_base.hpp:205

mfem::Vector
Vector data type.
Definition: vector.hpp:58

mfem::u
double u(const Vector &xvec)
Definition: lor_mms.hpp:22

mfem::Reshape
MFEM_HOST_DEVICE DeviceTensor< sizeof...(Dims), T > Reshape(T *ptr, Dims... dims)
Wrap a pointer as a DeviceTensor with automatically deduced template parameters.
Definition: dtensor.hpp:131