html/tmop__pa__h3s__c0_8cpp_source.html

// Copyright (c) 2010-2025, Lawrence Livermore National Security, LLC. Produced

// at the Lawrence Livermore National Laboratory. All Rights reserved. See files

// LICENSE and NOTICE for details. LLNL-CODE-806117.

//

// This file is part of the MFEM library. For more information and source code

// availability visit https://mfem.org.

//

// MFEM is free software; you can redistribute it and/or modify it under the

// terms of the BSD-3 license. We welcome feedback and contributions, see file

// CONTRIBUTING.md for details.


#include "../tmop.hpp"

#include "tmop_pa.hpp"

#include "../linearform.hpp"

#include "../../general/forall.hpp"

#include "../../linalg/kernels.hpp"


namespace mfem

{


/// Setup kernel for the 3D, partially assembled Hessian of the limiting term.
///
/// For every element e and every quadrature point (qx,qy,qz) the kernel writes
/// into h0_ the 3x3 matrix
///
///    W(qx,qy,qz) * det(J(.,.,qx,qy,qz,e)) * lim_normal * c0 * grad_grad,
///
/// where grad_grad is
///  - exp_lim == false:  (1/dist^2) * I
///  - exp_lim == true:   (400*f/dist^4) * d d^T + (20*f/dist^2) * I,
///                       with d = p1 - p0 and f = exp(10*(|d|^2/dist^2 - 1)).
///
/// dist, p0 and p1 are what PullEval returns at the quadrature point after
/// lim_dist (with bld_), x0_ (with b_) and x1_ (with b_) have been passed
/// through the EvalX/EvalY/EvalZ helpers -- presumably the tensor-product
/// interpolation of the nodal data; confirm against kernels.hpp.
///
/// @param[in]  lim_normal  Scalar factor multiplied into every output entry.
/// @param[in]  lim_dist    Read as a D1D x D1D x D1D x NE tensor.
/// @param[in]  c0_         Coefficient: a single value if its size is 1,
///                         otherwise read as a Q1D x Q1D x Q1D x NE tensor.
/// @param[in]  NE          Number of work items given to forall_3D and extent
///                         of the last (element) index of all tensors.
/// @param[in]  j_          Read as DIM x DIM x Q1D x Q1D x Q1D x NE; only its
///                         determinant at each point is used.
/// @param[in]  w_          Read as a Q1D x Q1D x Q1D tensor of weights.
/// @param[in]  b_          Read as Q1D x D1D; used for x0_ and x1_.
/// @param[in]  bld_        Read as Q1D x D1D; used for lim_dist.
/// @param[in]  x0_         Read as D1D x D1D x D1D x DIM x NE.
/// @param[in]  x1_         Read as D1D x D1D x D1D x DIM x NE.
/// @param[out] h0_         Accessed through Write() and assigned as a
///                         DIM x DIM x Q1D x Q1D x Q1D x NE tensor.
/// @param[in]  exp_lim     Selects the exponential formula (true) or the
///                         diagonal 1/dist^2 formula (false).
/// @param[in]  d1d         Runtime D1D, used only when T_D1D is 0.
/// @param[in]  q1d         Runtime Q1D, used only when T_Q1D is 0.
///
/// T_D1D, T_Q1D and T_MAX are referenced below but declared outside this
/// block (presumably template parameters introduced by the macro).
MFEM_REGISTER_TMOP_KERNELS(void, SetupGradPA_Kernel_C0_3D,

                           const real_t lim_normal,

                           const Vector &lim_dist,

                           const Vector &c0_,

                           const int NE,

                           const DenseTensor &j_,

                           const Array<real_t> &w_,

                           const Array<real_t> &b_,

                           const Array<real_t> &bld_,

                           const Vector &x0_,

                           const Vector &x1_,

                           Vector &h0_,

                           const bool exp_lim,

                           const int d1d,

                           const int q1d)

{

   constexpr int DIM = 3;

   // A nonzero template size takes precedence over the runtime argument.
   const int D1D = T_D1D ? T_D1D : d1d;

   const int Q1D = T_Q1D ? T_Q1D : q1d;


   // A c0_ of size 1 is treated as one constant coefficient; it is then
   // wrapped as a 1x1x1x1 tensor so both cases have the same type.
   const bool const_c0 = c0_.Size() == 1;

   const auto C0 = const_c0 ?

                   Reshape(c0_.Read(), 1, 1, 1, 1) :

                   Reshape(c0_.Read(), Q1D, Q1D, Q1D, NE);

   const auto LD = Reshape(lim_dist.Read(), D1D, D1D, D1D, NE);

   const auto J = Reshape(j_.Read(), DIM, DIM, Q1D, Q1D, Q1D, NE);

   // Both basis arrays are viewed with the same (Q1D, D1D) extents.
   const auto b = Reshape(b_.Read(), Q1D, D1D);

   const auto bld = Reshape(bld_.Read(), Q1D, D1D);

   const auto W = Reshape(w_.Read(), Q1D, Q1D, Q1D);

   // x0_/x1_ are viewed with the same D1D as lim_dist.
   const auto X0 = Reshape(x0_.Read(), D1D, D1D, D1D, DIM, NE);

   const auto X1 = Reshape(x1_.Read(), D1D, D1D, D1D, DIM, NE);


   // Output view; every (i,j,qx,qy,qz,e) entry is assigned in the loop below.
   auto H0 = Reshape(h0_.Write(), DIM, DIM, Q1D, Q1D, Q1D, NE);


   // One work item per element; Q1D is passed as the X, Y and Z sizes.
   mfem::forall_3D(NE, Q1D, Q1D, Q1D, [=] MFEM_HOST_DEVICE (int e)

   {

      // DIM, D1D and Q1D are redeclared here and shadow the outer definitions.
      constexpr int DIM = 3;

      const int D1D = T_D1D ? T_D1D : d1d;

      const int Q1D = T_Q1D ? T_Q1D : q1d;

      // Compile-time array bounds: the template size when it is nonzero,
      // otherwise T_MAX.
      constexpr int MQ1 = T_Q1D ? T_Q1D : T_MAX;

      constexpr int MD1 = T_D1D ? T_D1D : T_MAX;

      constexpr int MDQ = (MQ1 > MD1) ? MQ1 : MD1;


      // B receives b (loaded further below); sBLD receives bld right away.
      MFEM_SHARED real_t B[MQ1*MD1];

      MFEM_SHARED real_t sBLD[MQ1*MD1];

      kernels::internal::LoadB<MD1,MQ1>(D1D,Q1D,bld,sBLD);

      ConstDeviceMatrix BLD(sBLD, D1D, Q1D);


      // Scratch for the scalar lim_dist field. Only two buffers back the four
      // views: DDD and DQQ alias sm0, DDQ and QQQ alias sm1, so each stage
      // reads one buffer and writes the other.
      // NOTE(review): this relies on the Eval helpers separating consecutive
      // stages (synchronization is not visible here) -- confirm in kernels.hpp.
      MFEM_SHARED real_t sm0[MDQ*MDQ*MDQ];

      MFEM_SHARED real_t sm1[MDQ*MDQ*MDQ];

      DeviceCube DDD(sm0, MD1,MD1,MD1);

      DeviceCube DDQ(sm1, MD1,MD1,MQ1);

      DeviceCube DQQ(sm0, MD1,MQ1,MQ1);

      DeviceCube QQQ(sm1, MQ1,MQ1,MQ1);


      // Three-component scratch for x0_ (suffix 0); one array per stage.
      MFEM_SHARED real_t DDD0[3][MD1*MD1*MD1];

      MFEM_SHARED real_t DDQ0[3][MD1*MD1*MQ1];

      MFEM_SHARED real_t DQQ0[3][MD1*MQ1*MQ1];

      MFEM_SHARED real_t QQQ0[3][MQ1*MQ1*MQ1];


      // Three-component scratch for x1_ (suffix 1); one array per stage.
      MFEM_SHARED real_t DDD1[3][MD1*MD1*MD1];

      MFEM_SHARED real_t DDQ1[3][MD1*MD1*MQ1];

      MFEM_SHARED real_t DQQ1[3][MD1*MQ1*MQ1];

      MFEM_SHARED real_t QQQ1[3][MQ1*MQ1*MQ1];


      // Load the data of element e: lim_dist, x0_ and x1_.
      kernels::internal::LoadX(e,D1D,LD,DDD);

      kernels::internal::LoadX<MD1>(e,D1D,X0,DDD0);

      kernels::internal::LoadX<MD1>(e,D1D,X1,DDD1);


      kernels::internal::LoadB<MD1,MQ1>(D1D,Q1D,b,B);


      // lim_dist with BLD: DDD -> DDQ -> DQQ -> QQQ.
      kernels::internal::EvalX(D1D,Q1D,BLD,DDD,DDQ);

      kernels::internal::EvalY(D1D,Q1D,BLD,DDQ,DQQ);

      kernels::internal::EvalZ(D1D,Q1D,BLD,DQQ,QQQ);


      // x0_ with B: DDD0 -> DDQ0 -> DQQ0 -> QQQ0.
      kernels::internal::EvalX<MD1,MQ1>(D1D,Q1D,B,DDD0,DDQ0);

      kernels::internal::EvalY<MD1,MQ1>(D1D,Q1D,B,DDQ0,DQQ0);

      kernels::internal::EvalZ<MD1,MQ1>(D1D,Q1D,B,DQQ0,QQQ0);


      // x1_ with B: DDD1 -> DDQ1 -> DQQ1 -> QQQ1.
      kernels::internal::EvalX<MD1,MQ1>(D1D,Q1D,B,DDD1,DDQ1);

      kernels::internal::EvalY<MD1,MQ1>(D1D,Q1D,B,DDQ1,DQQ1);

      kernels::internal::EvalZ<MD1,MQ1>(D1D,Q1D,B,DQQ1,QQQ1);


      // Visit every quadrature point (qx,qy,qz) of element e.
      MFEM_FOREACH_THREAD(qz,z,Q1D)

      {

         MFEM_FOREACH_THREAD(qy,y,Q1D)

         {

            MFEM_FOREACH_THREAD(qx,x,Q1D)

            {

               // Scalar factor common to all nine entries at this point:
               // weight_m = W * det(Jtr) * lim_normal * c0.
               const real_t *Jtr = &J(0,0,qx,qy,qz,e);

               const real_t detJtr = kernels::Det<3>(Jtr);

               const real_t weight = W(qx,qy,qz) * detJtr;

               const real_t coeff0 = const_c0 ? C0(0,0,0,0) : C0(qx,qy,qz,e);

               const real_t weight_m = weight * lim_normal * coeff0;


               // Fetch the values at this point: D from lim_dist, p0 from
               // x0_, p1 from x1_.
               real_t D, p0[3], p1[3];

               kernels::internal::PullEval(qx,qy,qz,QQQ,D);

               kernels::internal::PullEval<MQ1>(Q1D,qx,qy,qz,QQQ0,p0);

               kernels::internal::PullEval<MQ1>(Q1D,qx,qy,qz,QQQ1,p1);


               const real_t dist = D; // GetValues, default comp set to 0


               // lim_func->Eval_d2(p1, p0, d_vals(q), grad_grad);


               // 3x3 second-derivative matrix stored as 9 contiguous values.
               real_t grad_grad[9];


               if (!exp_lim)

               {

                  // d2.Diag(1.0 / (dist * dist), x.Size());

                  // Diagonal matrix with 1/dist^2 on the diagonal; p0 and p1
                  // are not used in this branch.
                  const real_t c = 1.0 / (dist * dist);

                  kernels::Diag<3>(c, grad_grad);

               }

               else

               {

                  // tmp = p1 - p0 and dsq = |p1 - p0|^2.
                  real_t tmp[3];

                  kernels::Subtract<3>(1.0, p1, p0, tmp);

                  real_t dsq = kernels::DistanceSquared<3>(p1,p0);

                  real_t dist_squared = dist*dist;

                  real_t dist_squared_squared = dist_squared*dist_squared;

                  // f = exp(10 * (dsq/dist^2 - 1)).
                  // NOTE(review): the numeric literals here are double, so
                  // with a float real_t these expressions are evaluated in
                  // double before being stored -- confirm that is intended.
                  real_t f = exp(10.0*((dsq / dist_squared)-1.0));

                  // grad_grad = 400*f/dist^4 * tmp tmp^T + 20*f/dist^2 * I.
                  // Entries 3, 6 and 7 are copies of 1, 2 and 5, so the
                  // matrix is symmetric.
                  grad_grad[0] = ((400.0*tmp[0]*tmp[0]*f)/dist_squared_squared)+

                                 (20.0*f/dist_squared);

                  grad_grad[1] = (400.0*tmp[0]*tmp[1]*f)/dist_squared_squared;

                  grad_grad[2] = (400.0*tmp[0]*tmp[2]*f)/dist_squared_squared;

                  grad_grad[3] = grad_grad[1];

                  grad_grad[4] = ((400.0*tmp[1]*tmp[1]*f)/dist_squared_squared)+

                                 (20.0*f/dist_squared);

                  grad_grad[5] = (400.0*tmp[1]*tmp[2]*f)/dist_squared_squared;

                  grad_grad[6] = grad_grad[2];

                  grad_grad[7] = grad_grad[5];

                  grad_grad[8] = ((400.0*tmp[2]*tmp[2]*f)/dist_squared_squared)+

                                 (20.0*f/dist_squared);

               }

               // Read-only DIM x DIM view of grad_grad for (i,j) indexing.
               ConstDeviceMatrix gg(grad_grad,DIM,DIM);


               // Store the scaled matrix for this point and element.
               for (int i = 0; i < DIM; i++)

               {

                  for (int j = 0; j < DIM; j++)

                  {

                     H0(i,j,qx,qy,qz,e) = weight_m * gg(i,j);

                  }

               }

            }

         }

      }

   });

}


void TMOP_Integrator::AssembleGradPA_C0_3D(const Vector &X) const

{

   const int N = PA.ne;

   const int D1D = PA.maps_lim->ndof;

   const int Q1D = PA.maps_lim->nqpt;

   const int id = (D1D << 4 ) | Q1D;

   const real_t ln = lim_normal;

   const Vector &LD = PA.LD;

   const DenseTensor &J = PA.Jtr;

   const Array<real_t> &W = PA.ir->GetWeights();

   const Array<real_t> &B   = PA.maps->B;

   const Array<real_t> &BLD = PA.maps_lim->B;

   const Vector &C0 = PA.C0;

   const Vector &XL = PA.XL;

   Vector &H0 = PA.H0;


   auto el = dynamic_cast<TMOP_ExponentialLimiter *>(lim_func);

   const bool exp_lim = (el) ? true : false;


   MFEM_LAUNCH_TMOP_KERNEL(SetupGradPA_Kernel_C0_3D,id,ln,LD,C0,N,J,W,B,BLD,XL,X,

                           H0,exp_lim);

}


} // namespace mfem

mfem::Array
Definition array.hpp:47

mfem::Array::Read
const T * Read(bool on_dev=true) const
Shortcut for mfem::Read(a.GetMemory(), a.Size(), on_dev).
Definition array.hpp:337

mfem::DenseTensor
Rank 3 tensor (array of matrices)
Definition densemat.hpp:1112

mfem::DenseTensor::Read
const real_t * Read(bool on_dev=true) const
Shortcut for mfem::Read( GetMemory(), TotalSize(), on_dev).
Definition densemat.hpp:1270

mfem::DeviceTensor
A basic generic Tensor class, appropriate for use on the GPU.
Definition dtensor.hpp:82

mfem::TMOP_ExponentialLimiter
Exponential limiter function in TMOP_Integrator.
Definition tmop.hpp:1349

mfem::TMOP_Integrator::H0
Vector H0
Definition tmop.hpp:2019

mfem::TMOP_Integrator::lim_func
TMOP_LimiterFunction * lim_func
Definition tmop.hpp:1920

mfem::TMOP_Integrator::lim_normal
real_t lim_normal
Definition tmop.hpp:1922

mfem::TMOP_Integrator::XL
Vector XL
Definition tmop.hpp:2019

mfem::TMOP_Integrator::C0
Vector C0
Definition tmop.hpp:2019

mfem::TMOP_Integrator::AssembleGradPA_C0_3D
void AssembleGradPA_C0_3D(const Vector &) const
Definition tmop_pa_h3s_c0.cpp:169

mfem::TMOP_Integrator::PA
struct mfem::TMOP_Integrator::@26 PA

mfem::TMOP_Integrator::LD
Vector LD
Definition tmop.hpp:2019

mfem::Vector
Vector data type.
Definition vector.hpp:82

mfem::Vector::Read
virtual const real_t * Read(bool on_dev=true) const
Shortcut for mfem::Read(vec.GetMemory(), vec.Size(), on_dev).
Definition vector.hpp:494

mfem::Vector::Size
int Size() const
Returns the size of the vector.
Definition vector.hpp:226

mfem::Vector::Write
virtual real_t * Write(bool on_dev=true)
Shortcut for mfem::Write(vec.GetMemory(), vec.Size(), on_dev).
Definition vector.hpp:502

forall.hpp

kernels.hpp

linearform.hpp

b
real_t b
Definition lissajous.cpp:42

DIM
constexpr int DIM
Definition minimal-surface.cpp:72

mfem::kernels::DistanceSquared
MFEM_HOST_DEVICE real_t DistanceSquared(const real_t *x, const real_t *y)
Compute the square of the Euclidean distance to another vector.
Definition kernels.hpp:40

mfem::kernels::Diag
MFEM_HOST_DEVICE void Diag(const real_t c, real_t *data)
Creates n x n diagonal matrix with diagonal elements c.
Definition kernels.hpp:49

mfem::kernels::Det
MFEM_HOST_DEVICE T Det(const T *data)
Compute the determinant of a square matrix of size dim with given data.
Definition kernels.hpp:237

mfem::kernels::Subtract
MFEM_HOST_DEVICE void Subtract(const real_t a, const real_t *x, const real_t *y, real_t *z)
Vector subtraction operation: z = a * (x - y)
Definition kernels.hpp:58

mfem
Definition CodeDocumentation.dox:1

mfem::MFEM_REGISTER_TMOP_KERNELS
MFEM_REGISTER_TMOP_KERNELS(void, DatcSize, const int NE, const int ncomp, const int sizeidx, const real_t input_min_size, const DenseMatrix &w_, const Array< real_t > &b_, const Vector &x_, const Vector &nc_reduce, DenseTensor &j_, const int d1d, const int q1d)
Definition tmop_pa_da3.cpp:20

mfem::Reshape
MFEM_HOST_DEVICE DeviceTensor< sizeof...(Dims), T > Reshape(T *ptr, Dims... dims)
Wrap a pointer as a DeviceTensor with automatically deduced template parameters.
Definition dtensor.hpp:131

mfem::forall_3D
void forall_3D(int N, int X, int Y, int Z, lambda &&body)
Definition forall.hpp:774

mfem::real_t
float real_t
Definition config.hpp:43

mfem::f
std::function< real_t(const Vector &)> f(real_t mass_coeff)
Definition lor_mms.hpp:30

tmop.hpp

tmop_pa.hpp