html/interpolate__local__3_8cpp_source.html

// Copyright (c) 2010-2025, Lawrence Livermore National Security, LLC. Produced

// at the Lawrence Livermore National Laboratory. All Rights reserved. See files

// LICENSE and NOTICE for details. LLNL-CODE-806117.

//

// This file is part of the MFEM library. For more information and source code

// availability visit https://mfem.org.

//

// MFEM is free software; you can redistribute it and/or modify it under the

// terms of the BSD-3 license. We welcome feedback and contributions, see file

// CONTRIBUTING.md for details.


#include "../gslib.hpp"

#include "../../general/forall.hpp"


#ifdef MFEM_USE_GSLIB


#ifdef MFEM_HAVE_GCC_PRAGMA_DIAGNOSTIC

#pragma GCC diagnostic push

#pragma GCC diagnostic ignored "-Wunused-function"

#endif

#include "gslib.h"

#ifndef GSLIB_RELEASE_VERSION //gslib v1.0.7

#define GSLIB_RELEASE_VERSION 10007

#endif

#ifdef MFEM_HAVE_GCC_PRAGMA_DIAGNOSTIC

#pragma GCC diagnostic pop

#endif

namespace mfem

{

#if GSLIB_RELEASE_VERSION >= 10009

// Integer status codes. None of the three macros is referenced by the code
// visible in this file; they are #undef'd again at the end of this
// GSLIB_RELEASE_VERSION >= 10009 branch.
// NOTE(review): presumably these mirror the point-location codes used by the
// other gslib kernels (inside element / on border / not found) - confirm.
#define CODE_INTERNAL 0

#define CODE_BORDER 1

#define CODE_NOT_FOUND 2


/// Evaluate a single 1D Lagrange-type basis function at @a x.
///
/// Stores in p0[i] the value
///    lagrangeCoeff[i] * 2^(p_Nq-1) * prod_{j != i} (x - z[j]),
/// where j runs over the p_Nq nodes in @a z. Only entry @a i of @a p0 is
/// written, so one call is needed per basis function.
///
/// @param[out] p0            Output array; entry @a i is overwritten.
/// @param[in]  x             Evaluation coordinate.
/// @param[in]  i             Index of the basis function to evaluate.
/// @param[in]  p_Nq          Number of 1D nodes. The 2^(p_Nq-1) factor is
///                           formed with an int shift, so p_Nq-1 must be
///                           smaller than the bit width of int.
/// @param[in]  z             The p_Nq node coordinates.
/// @param[in]  lagrangeCoeff Per-node scaling coefficients.
static MFEM_HOST_DEVICE void lagrange_eval(double *p0, double x,
                                           int i, int p_Nq,
                                           double *z, double *lagrangeCoeff)
{
   // Start from the power-of-two scale and accumulate the node differences.
   double product = (1 << (p_Nq - 1));
   for (int node = 0; node < p_Nq; ++node)
   {
      // The factor belonging to the function's own node is omitted.
      if (node == i) { continue; }
      product *= x - z[node];
   }
   p0[i] = lagrangeCoeff[i] * product;
}


/// Interpolate a multi-component nodal field at points given by an element
/// index and three reference-space coordinates (3D tensor-product basis).
///
/// For every point i the kernel
///   1. evaluates the D1D one-dimensional basis values in each of the three
///      reference directions with lagrange_eval(), and
///   2. for every component, contracts those values against the D1D^3
///      element-local dofs and stores the result in int_out[i + fld*npt].
///
/// @tparam T_D1D     Compile-time number of 1D dofs; 0 selects the runtime
///                   value @a pN.
/// @param gf_in      Input dofs, read at
///                   el[i]*D1D^3*ncomp + fld*D1D^3 + (j + k*D1D + l*D1D^2).
/// @param el         Element index of each point (entries 0..npt-1 are read).
/// @param r          Reference coordinates, three per point (r[3*i+k]).
/// @param int_out    Output values, written at int_out[i + fld*npt].
/// @param npt        Number of points.
/// @param ncomp      Number of field components.
/// @param nel        Not used by this kernel.
/// @param gf_offset  Not used by this kernel (only referenced by the
///                   commented-out alternative dof layout below).
/// @param gll1D      1D node coordinates forwarded to lagrange_eval().
/// @param lagcoeff   Per-node coefficients forwarded to lagrange_eval().
/// @param pN         Runtime number of 1D dofs, used only when T_D1D == 0.
template<int T_D1D = 0>
static void InterpolateLocal3DKernel(const double *const gf_in,
                                     int *const el,
                                     double *const r,
                                     double *const int_out,
                                     const int npt,
                                     const int ncomp,
                                     const int nel,
                                     const int gf_offset,
                                     double *gll1D,
                                     double *lagcoeff,
                                     const int pN = 0)
{
   const int Nfields = ncomp;
   const int MD1 = T_D1D ? T_D1D : DofQuadLimits::MAX_D1D;
   const int D1D = T_D1D ? T_D1D : pN;
   const int p_Np = D1D*D1D*D1D;
   MFEM_VERIFY(MD1 <= DofQuadLimits::MAX_D1D,
               "Increase Max allowable polynomial order.");
   MFEM_VERIFY(D1D != 0, "Polynomial order not specified.");
   // The scratch arrays below are sized with MD1 but indexed with D1D. On the
   // runtime path (T_D1D == 0) the check on MD1 above is trivially satisfied,
   // so D1D itself has to be validated to avoid writing past wtr/sums.
   MFEM_VERIFY(D1D > 0 && D1D <= MD1,
               "Number of 1D dofs is outside the supported range.");
   // The y-extent must cover both the 3 reference directions (basis
   // evaluation) and the D1D rows of the contraction.
   const int nThreadsy = (D1D > 3) ? D1D : 3;
   mfem::forall_2D(npt, D1D, nThreadsy, [=] MFEM_HOST_DEVICE (int i)
   {
      // wtr holds the 1D basis values: direction k occupies
      // wtr[k*D1D .. k*D1D + D1D-1]. sums holds one partial result per (j,k).
      MFEM_SHARED double wtr[3*MD1];
      MFEM_SHARED double sums[MD1*MD1];

      // Evaluate basis functions at the reference space coordinates
      MFEM_FOREACH_THREAD(j,x,D1D)
      {
         MFEM_FOREACH_THREAD(k,y,3)
         {
            lagrange_eval(wtr + k*D1D, r[3*i+k], j, D1D, gll1D, lagcoeff);
         }
      }
      // All of wtr must be written before it is read below.
      MFEM_SYNC_THREAD;

      for (int fld = 0; fld < Nfields; ++fld)
      {
         // If using GetNodalValues, ordering is NDOFSxNELxVDIM
         // const int elemOffset = el[i] * p_Np + fld * gf_offset;
         // If using R->Mult for L -> E-Vec, use the ordering below.
         const int elemOffset = el[i] * p_Np * Nfields + fld * p_Np;
         MFEM_FOREACH_THREAD(j,x,D1D)
         {
            MFEM_FOREACH_THREAD(k,y,D1D)
            {
               // Contract the third direction first, then scale by the basis
               // values of the first two directions.
               sums[j + k*D1D] = 0.0;
               for (int l = 0; l < D1D; ++l)
               {
                  sums[j + k*D1D] += gf_in[elemOffset + j + k*D1D + l*D1D*D1D] *
                                     wtr[2*D1D+l];
               }
               sums[j+k*D1D] *= wtr[D1D+k]*wtr[j];
            }
         }
         // Every partial sum must be complete before the reduction.
         MFEM_SYNC_THREAD;

         // Loop bounds of 1: only the j == 0, k == 0 iteration performs the
         // final reduction over all D1D*D1D partial sums and the store.
         MFEM_FOREACH_THREAD(j,x,1)
         {
            MFEM_FOREACH_THREAD(k,y,1)
            {
               double sumv = 0.0;
               for (int jj = 0; jj < D1D*D1D; ++jj)
               {
                  sumv += sums[jj];
               }
               int_out[i + fld * npt] = sumv;
            }
         }
         // sums is overwritten by the next component; wait for the reduction.
         MFEM_SYNC_THREAD;
      }
   });
}


void FindPointsGSLIB::InterpolateLocal3(const Vector &field_in,

                                        Array<int> &gsl_elem_dev_l,

                                        Vector &gsl_ref_l,

                                        Vector &field_out,

                                        int npt, int ncomp,

                                        int nel, int dof1Dsol)

{

   if (npt == 0) { return; }

   const int gf_offset = field_in.Size()/ncomp;

   auto pfin = field_in.Read();

   auto pgsle = gsl_elem_dev_l.ReadWrite();

   auto pgslr = gsl_ref_l.ReadWrite();

   auto pfout = field_out.Write();

   auto pgll = DEV.gll1d_sol.ReadWrite();

   auto plcf = DEV.lagcoeff_sol.ReadWrite();

   switch (dof1Dsol)

   {

      case 2: return InterpolateLocal3DKernel<2>(pfin, pgsle, pgslr, pfout,

                                                    npt, ncomp, nel, gf_offset,

                                                    pgll, plcf);

      case 3: return InterpolateLocal3DKernel<3>(pfin, pgsle, pgslr, pfout,

                                                    npt, ncomp, nel, gf_offset,

                                                    pgll, plcf);

      case 4: return InterpolateLocal3DKernel<4>(pfin, pgsle, pgslr, pfout,

                                                    npt, ncomp, nel, gf_offset,

                                                    pgll, plcf);

      case 5: return InterpolateLocal3DKernel<5>(pfin, pgsle, pgslr, pfout,

                                                    npt, ncomp, nel, gf_offset,

                                                    pgll, plcf);

      default: return InterpolateLocal3DKernel(pfin, pgsle, pgslr, pfout,

                                                  npt, ncomp, nel, gf_offset,

                                                  pgll, plcf, dof1Dsol);

   }

}


#undef CODE_INTERNAL

#undef CODE_BORDER

#undef CODE_NOT_FOUND

#else

/// Fallback definition compiled when GSLIB_RELEASE_VERSION < 10009.
///
/// Intentionally a no-op: none of the arguments is read and @a field_out is
/// left unmodified. It exists so that the member function is defined
/// regardless of which branch of the version check is compiled.
void FindPointsGSLIB::InterpolateLocal3(const Vector &field_in,
                                        Array<int> &gsl_elem_dev_l,
                                        Vector &gsl_ref_l,
                                        Vector &field_out,
                                        int npt, int ncomp,
                                        int nel, int dof1Dsol)
{
   // Nothing to do; see the function comment.
}

#endif

} // namespace mfem


#endif //ifdef MFEM_USE_GSLIB

mfem::Array
Definition array.hpp:48

mfem::Array::ReadWrite
T * ReadWrite(bool on_dev=true)
Shortcut for mfem::ReadWrite(a.GetMemory(), a.Size(), on_dev).
Definition array.hpp:397

mfem::FindPointsGSLIB::DEV
struct mfem::FindPointsGSLIB::@24 DEV

mfem::FindPointsGSLIB::InterpolateLocal3
void InterpolateLocal3(const Vector &field_in, Array< int > &gsl_elem_dev_l, Vector &gsl_ref_l, Vector &field_out, int npt, int ncomp, int nel, int dof1dsol)
Definition interpolate_local_3.cpp:123

mfem::Vector
Vector data type.
Definition vector.hpp:82

mfem::Vector::Read
virtual const real_t * Read(bool on_dev=true) const
Shortcut for mfem::Read(vec.GetMemory(), vec.Size(), on_dev).
Definition vector.hpp:520

mfem::Vector::ReadWrite
virtual real_t * ReadWrite(bool on_dev=true)
Shortcut for mfem::ReadWrite(vec.GetMemory(), vec.Size(), on_dev).
Definition vector.hpp:536

mfem::Vector::Size
int Size() const
Returns the size of the vector.
Definition vector.hpp:234

mfem::Vector::Write
virtual real_t * Write(bool on_dev=true)
Shortcut for mfem::Write(vec.GetMemory(), vec.Size(), on_dev).
Definition vector.hpp:528

forall.hpp

gslib.hpp

mfem
Definition CodeDocumentation.dox:1

mfem::forall_2D
void forall_2D(int N, int X, int Y, lambda &&body)
Definition forall.hpp:925