4.6/lor__batched_8cpp_source.html

 // Copyright (c) 2010-2023, Lawrence Livermore National Security, LLC. Produced
 // at the Lawrence Livermore National Laboratory. All Rights reserved. See files
 // LICENSE and NOTICE for details. LLNL-CODE-806117.
 //
 // This file is part of the MFEM library. For more information and source code
 // availability visit https://mfem.org.
 //
 // MFEM is free software; you can redistribute it and/or modify it under the
 // terms of the BSD-3 license. We welcome feedback and contributions, see file
 // CONTRIBUTING.md for details.

 #include "lor_batched.hpp"
 #include "../../fem/quadinterpolator.hpp"
 #include "../../general/forall.hpp"
 #include <climits>
 #include "../pbilinearform.hpp"

 // Specializations
 #include "lor_h1.hpp"
 #include "lor_nd.hpp"
 #include "lor_rt.hpp"

 namespace mfem
 {

 template <typename T1, typename T2>
 bool HasIntegrators(BilinearForm &a)
 {
    Array<BilinearFormIntegrator*> *integs = a.GetDBFI();
    if (integs == NULL) { return false; }
    if (integs->Size() == 1)
    {
       BilinearFormIntegrator *i0 = (*integs)[0];
       if (dynamic_cast<T1*>(i0) || dynamic_cast<T2*>(i0)) { return true; }
    }
    else if (integs->Size() == 2)
    {
       BilinearFormIntegrator *i0 = (*integs)[0];
       BilinearFormIntegrator *i1 = (*integs)[1];
       if ((dynamic_cast<T1*>(i0) && dynamic_cast<T2*>(i1)) ||
           (dynamic_cast<T2*>(i0) && dynamic_cast<T1*>(i1)))
       {
          return true;
       }
    }
    return false;
 }

 bool BatchedLORAssembly::FormIsSupported(BilinearForm &a)
 {
    const FiniteElementCollection *fec = a.FESpace()->FEColl();
    // TODO: check for maximum supported orders

    // Batched LOR requires all tensor elements
    if (!UsesTensorBasis(*a.FESpace())) { return false; }

    if (dynamic_cast<const H1_FECollection*>(fec))
    {
       if (HasIntegrators<DiffusionIntegrator, MassIntegrator>(a)) { return true; }
    }
    else if (dynamic_cast<const ND_FECollection*>(fec))
    {
       if (HasIntegrators<CurlCurlIntegrator, VectorFEMassIntegrator>(a)) { return true; }
    }
    else if (dynamic_cast<const RT_FECollection*>(fec))
    {
       if (HasIntegrators<DivDivIntegrator, VectorFEMassIntegrator>(a)) { return true; }
    }
    return false;
 }

 void BatchedLORAssembly::FormLORVertexCoordinates(FiniteElementSpace &fes_ho,
                                                   Vector &X_vert)
 {
    Mesh &mesh_ho = *fes_ho.GetMesh();
    mesh_ho.EnsureNodes();

    // Get nodal points at the LOR vertices
    const int dim = mesh_ho.Dimension();
    const int nel_ho = mesh_ho.GetNE();
    const int order = fes_ho.GetMaxElementOrder();
    const int nd1d = order + 1;
    const int ndof_per_el = static_cast<int>(pow(nd1d, dim));

    const GridFunction *nodal_gf = mesh_ho.GetNodes();
    const FiniteElementSpace *nodal_fes = nodal_gf->FESpace();
    const Operator *nodal_restriction =
       nodal_fes->GetElementRestriction(ElementDofOrdering::LEXICOGRAPHIC);

    // Map from nodal L-vector to E-vector
    Vector nodal_evec(nodal_restriction->Height());
    nodal_restriction->Mult(*nodal_gf, nodal_evec);

    IntegrationRule ir = GetCollocatedIntRule(fes_ho);

    // Map from nodal E-vector to Q-vector at the LOR vertex points
    X_vert.SetSize(dim*ndof_per_el*nel_ho);
    const QuadratureInterpolator *quad_interp =
       nodal_fes->GetQuadratureInterpolator(ir);
    quad_interp->SetOutputLayout(QVectorLayout::byVDIM);
    quad_interp->Values(nodal_evec, X_vert);
 }

 // The following two functions (GetMinElt and GetAndIncrementNnzIndex) are
 // copied from restriction.cpp. Should they be factored out?

 // Return the minimal value found in both my_elts and nbr_elts
 static MFEM_HOST_DEVICE int GetMinElt(const int *my_elts, const int n_my_elts,
                                       const int *nbr_elts, const int n_nbr_elts)
 {
    int min_el = INT_MAX;
    for (int i = 0; i < n_my_elts; i++)
    {
       const int e_i = my_elts[i];
       if (e_i >= min_el) { continue; }
       for (int j = 0; j < n_nbr_elts; j++)
       {
          if (e_i==nbr_elts[j])
          {
             min_el = e_i; // we already know e_i < min_el
             break;
          }
       }
    }
    return min_el;
 }

 // Returns the index where a non-zero entry should be added and increment the
 // number of non-zeros for the row i_L.
 static MFEM_HOST_DEVICE int GetAndIncrementNnzIndex(const int i_L, int* I)
 {
    int ind = AtomicAdd(I[i_L],1);
    return ind;
 }

 int BatchedLORAssembly::FillI(SparseMatrix &A) const
 {
    static constexpr int Max = 16;

    const int nvdof = fes_ho.GetVSize();

    const int ndof_per_el = fes_ho.GetFE(0)->GetDof();
    const int nel_ho = fes_ho.GetNE();
    const int nnz_per_row = sparse_mapping.Size()/ndof_per_el;

    const ElementDofOrdering ordering = ElementDofOrdering::LEXICOGRAPHIC;
    const Operator *op = fes_ho.GetElementRestriction(ordering);
    const ElementRestriction *el_restr =
       dynamic_cast<const ElementRestriction*>(op);
    MFEM_VERIFY(el_restr != nullptr, "Bad element restriction");

    const Array<int> &el_dof_lex_ = el_restr->GatherMap();
    const Array<int> &dof_glob2loc_ = el_restr->Indices();
    const Array<int> &dof_glob2loc_offsets_ = el_restr->Offsets();

    const auto el_dof_lex = Reshape(el_dof_lex_.Read(), ndof_per_el, nel_ho);
    const auto dof_glob2loc = dof_glob2loc_.Read();
    const auto K = dof_glob2loc_offsets_.Read();
    const auto map = Reshape(sparse_mapping.Read(), nnz_per_row, ndof_per_el);

    auto I = A.WriteI();

    mfem::forall(nvdof + 1, [=] MFEM_HOST_DEVICE (int ii) { I[ii] = 0; });
    mfem::forall(ndof_per_el*nel_ho, [=] MFEM_HOST_DEVICE (int i)
    {
       const int ii_el = i%ndof_per_el;
       const int iel_ho = i/ndof_per_el;
       const int sii = el_dof_lex(ii_el, iel_ho);
       const int ii = (sii >= 0) ? sii : -1 -sii;
       // Get number and list of elements containing this DOF
       int i_elts[Max];
       const int i_offset = K[ii];
       const int i_next_offset = K[ii+1];
       const int i_ne = i_next_offset - i_offset;
       for (int e_i = 0; e_i < i_ne; ++e_i)
       {
          const int si_E = dof_glob2loc[i_offset+e_i]; // signed
          const int i_E = (si_E >= 0) ? si_E : -1 - si_E;
          i_elts[e_i] = i_E/ndof_per_el;
       }
       for (int j = 0; j < nnz_per_row; ++j)
       {
          int jj_el = map(j, ii_el);
          if (jj_el < 0) { continue; }
          // LDOF index of column
          const int sjj = el_dof_lex(jj_el, iel_ho); // signed
          const int jj = (sjj >= 0) ? sjj : -1 - sjj;
          const int j_offset = K[jj];
          const int j_next_offset = K[jj+1];
          const int j_ne = j_next_offset - j_offset;
          if (i_ne == 1 || j_ne == 1) // no assembly required
          {
             AtomicAdd(I[ii], 1);
          }
          else // assembly required
          {
             int j_elts[Max];
             for (int e_j = 0; e_j < j_ne; ++e_j)
             {
                const int sj_E = dof_glob2loc[j_offset+e_j]; // signed
                const int j_E = (sj_E >= 0) ? sj_E : -1 - sj_E;
                const int elt = j_E/ndof_per_el;
                j_elts[e_j] = elt;
             }
             const int min_e = GetMinElt(i_elts, i_ne, j_elts, j_ne);
             if (iel_ho == min_e) // add the nnz only once
             {
                AtomicAdd(I[ii], 1);
             }
          }
       }
    });
    // TODO: on device, this is a scan operation
    // We need to sum the entries of I, we do it on CPU as it is very sequential.
    auto h_I = A.HostReadWriteI();
    int sum = 0;
    for (int i = 0; i < nvdof; i++)
    {
       const int nnz = h_I[i];
       h_I[i] = sum;
       sum+=nnz;
    }
    h_I[nvdof] = sum;

    // Return the number of nnz
    return h_I[nvdof];
 }

 void BatchedLORAssembly::FillJAndData(SparseMatrix &A) const
 {
    const int nvdof = fes_ho.GetVSize();
    const int ndof_per_el = fes_ho.GetFE(0)->GetDof();
    const int nel_ho = fes_ho.GetNE();
    const int nnz_per_row = sparse_mapping.Size()/ndof_per_el;

    const ElementDofOrdering ordering = ElementDofOrdering::LEXICOGRAPHIC;
    const Operator *op = fes_ho.GetElementRestriction(ordering);
    const ElementRestriction *el_restr =
       dynamic_cast<const ElementRestriction*>(op);
    MFEM_VERIFY(el_restr != nullptr, "Bad element restriction");

    const Array<int> &el_dof_lex_ = el_restr->GatherMap();
    const Array<int> &dof_glob2loc_ = el_restr->Indices();
    const Array<int> &dof_glob2loc_offsets_ = el_restr->Offsets();

    const auto el_dof_lex = Reshape(el_dof_lex_.Read(), ndof_per_el, nel_ho);
    const auto dof_glob2loc = dof_glob2loc_.Read();
    const auto K = dof_glob2loc_offsets_.Read();

    const auto V = Reshape(sparse_ij.Read(), nnz_per_row, ndof_per_el, nel_ho);
    const auto map = Reshape(sparse_mapping.Read(), nnz_per_row, ndof_per_el);

    Array<int> I_(nvdof + 1);
    const auto I = I_.Write();
    const auto J = A.WriteJ();
    auto AV = A.WriteData();

    // Copy A.I into I, use it as a temporary buffer
    {
       const auto I2 = A.ReadI();
       mfem::forall(nvdof + 1, [=] MFEM_HOST_DEVICE (int i) { I[i] = I2[i]; });
    }

    static constexpr int Max = 16;

    mfem::forall(ndof_per_el*nel_ho, [=] MFEM_HOST_DEVICE (int i)
    {
       const int ii_el = i%ndof_per_el;
       const int iel_ho = i/ndof_per_el;
       // LDOF index of current row
       const int sii = el_dof_lex(ii_el, iel_ho); // signed
       const int ii = (sii >= 0) ? sii : -1 - sii;
       // Get number and list of elements containing this DOF
       int i_elts[Max];
       int i_B[Max];
       const int i_offset = K[ii];
       const int i_next_offset = K[ii+1];
       const int i_ne = i_next_offset - i_offset;
       for (int e_i = 0; e_i < i_ne; ++e_i)
       {
          const int si_E = dof_glob2loc[i_offset+e_i]; // signed
          const bool plus = si_E >= 0;
          const int i_E = plus ? si_E : -1 - si_E;
          i_elts[e_i] = i_E/ndof_per_el;
          const int i_Bi = i_E % ndof_per_el;
          i_B[e_i] = plus ? i_Bi : -1 - i_Bi; // encode with sign
       }
       for (int j=0; j<nnz_per_row; ++j)
       {
          int jj_el = map(j, ii_el);
          if (jj_el < 0) { continue; }
          // LDOF index of column
          const int sjj = el_dof_lex(jj_el, iel_ho); // signed
          const int jj = (sjj >= 0) ? sjj : -1 - sjj;
          const int sgn = ((sjj >=0 && sii >= 0) || (sjj < 0 && sii <0)) ? 1 : -1;
          const int j_offset = K[jj];
          const int j_next_offset = K[jj+1];
          const int j_ne = j_next_offset - j_offset;
          if (i_ne == 1 || j_ne == 1) // no assembly required
          {
             const int nnz = GetAndIncrementNnzIndex(ii, I);
             J[nnz] = jj;
             AV[nnz] = sgn*V(j, ii_el, iel_ho);
          }
          else // assembly required
          {
             int j_elts[Max];
             int j_B[Max];
             for (int e_j = 0; e_j < j_ne; ++e_j)
             {
                const int sj_E = dof_glob2loc[j_offset+e_j]; // signed
                const bool plus = sj_E >= 0;
                const int j_E = plus ? sj_E : -1 - sj_E;
                j_elts[e_j] = j_E/ndof_per_el;
                const int j_Bj = j_E % ndof_per_el;
                j_B[e_j] = plus ? j_Bj : -1 - j_Bj; // encode with sign
             }
             const int min_e = GetMinElt(i_elts, i_ne, j_elts, j_ne);
             if (iel_ho == min_e) // add the nnz only once
             {
                double val = 0.0;
                for (int k = 0; k < i_ne; k++)
                {
                   const int iel_ho_2 = i_elts[k];
                   const int sii_el_2 = i_B[k]; // signed
                   const int ii_el_2 = (sii_el_2 >= 0) ? sii_el_2 : -1 -sii_el_2;
                   for (int l = 0; l < j_ne; l++)
                   {
                      const int jel_ho_2 = j_elts[l];
                      if (iel_ho_2 == jel_ho_2)
                      {
                         const int sjj_el_2 = j_B[l]; // signed
                         const int jj_el_2 = (sjj_el_2 >= 0) ? sjj_el_2 : -1 -sjj_el_2;
                         const int sgn_2 = ((sjj_el_2 >=0 && sii_el_2 >= 0)
                                            || (sjj_el_2 < 0 && sii_el_2 <0)) ? 1 : -1;
                         int j2 = -1;
                         // find nonzero in matrix of other element
                         for (int m = 0; m < nnz_per_row; ++m)
                         {
                            if (map(m, ii_el_2) == jj_el_2)
                            {
                               j2 = m;
                               break;
                            }
                         }
                         MFEM_ASSERT_KERNEL(j >= 0, "Can't find nonzero");
                         val += sgn_2*V(j2, ii_el_2, iel_ho_2);
                      }
                   }
                }
                const int nnz = GetAndIncrementNnzIndex(ii, I);
                J[nnz] = jj;
                AV[nnz] = val;
             }
          }
       }
    });
 }

 void BatchedLORAssembly::SparseIJToCSR(OperatorHandle &A) const
 {
    const int nvdof = fes_ho.GetVSize();

    // If A contains an existing SparseMatrix, reuse it (and try to reuse its
    // I, J, A arrays if they are big enough)
    SparseMatrix *A_mat = A.Is<SparseMatrix>();
    if (!A_mat)
    {
       A_mat = new SparseMatrix;
       A.Reset(A_mat);
    }

    A_mat->OverrideSize(nvdof, nvdof);

    A_mat->GetMemoryI().New(nvdof+1, Device::GetDeviceMemoryType());
    int nnz = FillI(*A_mat);

    A_mat->GetMemoryJ().New(nnz, Device::GetDeviceMemoryType());
    A_mat->GetMemoryData().New(nnz, Device::GetDeviceMemoryType());
    FillJAndData(*A_mat);
 }

 template <typename LOR_KERNEL>
 void BatchedLORAssembly::AssemblyKernel(BilinearForm &a)
 {
    LOR_KERNEL kernel(a, fes_ho, X_vert, sparse_ij, sparse_mapping);

    const int dim = fes_ho.GetMesh()->Dimension();
    const int order = fes_ho.GetMaxElementOrder();

    if (dim == 2)
    {
       switch (order)
       {
          case 1: kernel.template Assemble2D<1>(); break;
          case 2: kernel.template Assemble2D<2>(); break;
          case 3: kernel.template Assemble2D<3>(); break;
          case 4: kernel.template Assemble2D<4>(); break;
          case 5: kernel.template Assemble2D<5>(); break;
          case 6: kernel.template Assemble2D<6>(); break;
          case 7: kernel.template Assemble2D<7>(); break;
          case 8: kernel.template Assemble2D<8>(); break;
          default: MFEM_ABORT("No kernel order " << order << "!");
       }
    }
    else if (dim == 3)
    {
       switch (order)
       {
          case 1: kernel.template Assemble3D<1>(); break;
          case 2: kernel.template Assemble3D<2>(); break;
          case 3: kernel.template Assemble3D<3>(); break;
          case 4: kernel.template Assemble3D<4>(); break;
          case 5: kernel.template Assemble3D<5>(); break;
          case 6: kernel.template Assemble3D<6>(); break;
          case 7: kernel.template Assemble3D<7>(); break;
          case 8: kernel.template Assemble3D<8>(); break;
          default: MFEM_ABORT("No kernel order " << order << "!");
       }
    }
 }

 void BatchedLORAssembly::AssembleWithoutBC(BilinearForm &a, OperatorHandle &A)
 {
    // Assemble the matrix, depending on what the form is.
    // This fills in the arrays sparse_ij and sparse_mapping.
    const FiniteElementCollection *fec = fes_ho.FEColl();
    if (dynamic_cast<const H1_FECollection*>(fec))
    {
       if (HasIntegrators<DiffusionIntegrator, MassIntegrator>(a))
       {
          AssemblyKernel<BatchedLOR_H1>(a);
       }
    }
    else if (dynamic_cast<const ND_FECollection*>(fec))
    {
       if (HasIntegrators<CurlCurlIntegrator, VectorFEMassIntegrator>(a))
       {
          AssemblyKernel<BatchedLOR_ND>(a);
       }
    }
    else if (dynamic_cast<const RT_FECollection*>(fec))
    {
       if (HasIntegrators<DivDivIntegrator, VectorFEMassIntegrator>(a))
       {
          AssemblyKernel<BatchedLOR_RT>(a);
       }
    }

    return SparseIJToCSR(A);
 }

 #ifdef MFEM_USE_MPI
 void BatchedLORAssembly::ParAssemble(
    BilinearForm &a, const Array<int> &ess_dofs, OperatorHandle &A)
 {
    // Assemble the system matrix local to this partition
    OperatorHandle A_local;
    AssembleWithoutBC(a, A_local);

    ParBilinearForm *pa =
       dynamic_cast<ParBilinearForm*>(&a);

    pa->ParallelRAP(*A_local.As<SparseMatrix>(), A, true);

    A.As<HypreParMatrix>()->EliminateBC(ess_dofs,
                                        Operator::DiagonalPolicy::DIAG_ONE);
 }
 #endif

 void BatchedLORAssembly::Assemble(
    BilinearForm &a, const Array<int> ess_dofs, OperatorHandle &A)
 {
 #ifdef MFEM_USE_MPI
    if (dynamic_cast<ParFiniteElementSpace*>(&fes_ho))
    {
       return ParAssemble(a, ess_dofs, A);
    }
 #endif

    AssembleWithoutBC(a, A);
    SparseMatrix *A_mat = A.As<SparseMatrix>();

    A_mat->EliminateBC(ess_dofs,
                       Operator::DiagonalPolicy::DIAG_KEEP);
 }

 BatchedLORAssembly::BatchedLORAssembly(FiniteElementSpace &fes_ho_)
    : fes_ho(fes_ho_)
 {
    FormLORVertexCoordinates(fes_ho, X_vert);
 }

 IntegrationRule GetCollocatedIntRule(FiniteElementSpace &fes)
 {
    IntegrationRules irs(0, Quadrature1D::GaussLobatto);
    const Geometry::Type geom = fes.GetMesh()->GetElementGeometry(0);
    const int nd1d = fes.GetMaxElementOrder() + 1;
    return irs.Get(geom, 2*nd1d - 3);
 }

 } // namespace mfem
mfem::Array::Read
const T * Read(bool on_dev=true) const
Shortcut for mfem::Read(a.GetMemory(), a.Size(), on_dev).
Definition: array.hpp:307

mfem::BatchedLORAssembly::ParAssemble
void ParAssemble(BilinearForm &a, const Array< int > &ess_dofs, OperatorHandle &A)
Assemble the system in parallel and place the result in A.
Definition: lor_batched.cpp:454

mfem::BatchedLORAssembly::fes_ho
FiniteElementSpace & fes_ho
The high-order space.
Definition: lor_batched.hpp:36

mfem::EliminateBC
void EliminateBC(const HypreParMatrix &A, const HypreParMatrix &Ae, const Array< int > &ess_dof_list, const Vector &X, Vector &B)
Eliminate essential BC specified by ess_dof_list from the solution X to the r.h.s. B.
Definition: hypre.cpp:3258

mfem::Mesh
Definition: mesh.hpp:52

mfem::IntegrationRule
Class for an integration rule - an Array of IntegrationPoint.
Definition: intrules.hpp:96

mfem::GridFunction
Class for grid function - Vector with associated FE space.
Definition: gridfunc.hpp:30

mfem::IntegrationRules::Get
const IntegrationRule & Get(int GeomType, int Order)
Returns an integration rule for given GeomType and Order.
Definition: intrules.cpp:980

mfem::Mesh::Dimension
int Dimension() const
Dimension of the reference space used within the elements.
Definition: mesh.hpp:1020

mfem::Vector::SetSize
void SetSize(int s)
Resize the vector to size s.
Definition: vector.hpp:517

mfem::OperatorHandle
Pointer to an Operator of a specified type.
Definition: handle.hpp:33

mfem::OperatorHandle::Is
OpType * Is() const
Return the Operator pointer dynamically cast to a specified OpType.
Definition: handle.hpp:108

mfem::Quadrature1D::GaussLobatto
Definition: intrules.hpp:397

mfem::ParBilinearForm::ParallelRAP
void ParallelRAP(SparseMatrix &loc_A, OperatorHandle &A, bool steal_loc_A=false)
Compute parallel RAP operator and store it in A as a HypreParMatrix.
Definition: pbilinearform.cpp:124

AtomicAdd
MFEM_HOST_DEVICE T AtomicAdd(T &add, const T val)
Definition: backends.hpp:84

mfem::IntegrationRules
Container class for integration rules.
Definition: intrules.hpp:412

mfem::Vector::Read
virtual const double * Read(bool on_dev=true) const
Shortcut for mfem::Read(vec.GetMemory(), vec.Size(), on_dev).
Definition: vector.hpp:453

mfem::Operator::Mult
virtual void Mult(const Vector &x, Vector &y) const =0
Operator application: y=A(x).

mfem::UsesTensorBasis
bool UsesTensorBasis(const FiniteElementSpace &fes)
Return true if the mesh contains only one topology and the elements are tensor elements.
Definition: fespace.hpp:1306

mfem::SparseMatrix::GetMemoryData
Memory< double > & GetMemoryData()
Definition: sparsemat.hpp:269

mfem::BatchedLORAssembly::FormIsSupported
static bool FormIsSupported(BilinearForm &a)
Returns true if the form a supports batched assembly, false otherwise.
Definition: lor_batched.cpp:49

mfem::SparseMatrix::GetMemoryI
Memory< int > & GetMemoryI()
Definition: sparsemat.hpp:237

mfem::FiniteElementSpace::GetFE
virtual const FiniteElement * GetFE(int i) const
Returns pointer to the FiniteElement in the FiniteElementCollection associated with i&#39;th element in t...
Definition: fespace.cpp:2841

mfem::BatchedLORAssembly::FormLORVertexCoordinates
static void FormLORVertexCoordinates(FiniteElementSpace &fes_ho, Vector &X_vert)
Compute the vertices of the LOR mesh and place the result in X_vert.
Definition: lor_batched.cpp:72

mfem::BatchedLORAssembly::FillI
int FillI(SparseMatrix &A) const
Fill the I array of the sparse matrix A.
Definition: lor_batched.cpp:136

mfem::FiniteElementSpace::GetElementRestriction
const ElementRestrictionOperator * GetElementRestriction(ElementDofOrdering e_ordering) const
Return an Operator that converts L-vectors to E-vectors.
Definition: fespace.cpp:1302

mfem::SparseMatrix::GetMemoryJ
Memory< int > & GetMemoryJ()
Definition: sparsemat.hpp:253

mfem::HasIntegrators
bool HasIntegrators(BilinearForm &a)
Definition: lor_batched.cpp:27

mfem::ElementRestriction::GatherMap
const Array< int > & GatherMap() const
Definition: restriction.hpp:97

mfem::FiniteElementSpace::GetMaxElementOrder
int GetMaxElementOrder() const
Return the maximum polynomial order.
Definition: fespace.hpp:573

mfem::SparseMatrix
Data type sparse matrix.
Definition: sparsemat.hpp:50

mfem
Definition: CodeDocumentation.dox:1

mfem::FiniteElementSpace::FEColl
const FiniteElementCollection * FEColl() const
Definition: fespace.hpp:723

mfem::QuadratureInterpolator
A class that performs interpolation from an E-vector to quadrature point values and/or derivatives (Q...
Definition: quadinterpolator.hpp:29

mfem::Array
Definition: adios2stream.hpp:44

lor_h1.hpp

mfem::Device::GetDeviceMemoryType
static MemoryType GetDeviceMemoryType()
Get the current Device MemoryType. This is the MemoryType used by most MFEM classes when allocating m...
Definition: device.hpp:273

mfem::BatchedLORAssembly::sparse_ij
Vector sparse_ij
The elementwise LOR matrices in a sparse "ij" format.
Definition: lor_batched.hpp:45

mfem::ElementRestriction::Offsets
const Array< int > & Offsets() const
Definition: restriction.hpp:99

mfem::BatchedLORAssembly::X_vert
Vector X_vert
LOR vertex coordinates.
Definition: lor_batched.hpp:38

mfem::BatchedLORAssembly::sparse_mapping
Array< int > sparse_mapping
The sparsity pattern of the element matrices.
Definition: lor_batched.hpp:54

lor_rt.hpp

mfem::SparseMatrix::WriteI
int * WriteI(bool on_dev=true)
Definition: sparsemat.hpp:241

mfem::GridFunction::FESpace
FiniteElementSpace * FESpace()
Definition: gridfunc.hpp:691

mfem::FiniteElementSpace::GetNE
int GetNE() const
Returns number of elements in the mesh.
Definition: fespace.hpp:736

lor_nd.hpp

mfem::Mesh::GetElementGeometry
Geometry::Type GetElementGeometry(int i) const
Definition: mesh.hpp:1228

mfem::FiniteElementSpace::GetMesh
Mesh * GetMesh() const
Returns the mesh.
Definition: fespace.hpp:555

mfem::BilinearFormIntegrator
Abstract base class BilinearFormIntegrator.
Definition: bilininteg.hpp:24

mfem::SparseMatrix::ReadI
const int * ReadI(bool on_dev=true) const
Definition: sparsemat.hpp:239

mfem::forall
void forall(int N, lambda &&body)
Definition: forall.hpp:742

mfem::ElementRestriction
Operator that converts FiniteElementSpace L-vectors to E-vectors.
Definition: restriction.hpp:37

mfem::FiniteElementSpace
Class FiniteElementSpace - responsible for providing FEM view of the mesh, mainly managing the set of...
Definition: fespace.hpp:219

mfem::QuadratureInterpolator::Values
void Values(const Vector &e_vec, Vector &q_val) const
Interpolate the values of the E-vector e_vec at quadrature points.
Definition: quadinterpolator.cpp:699

mfem::BatchedLORAssembly::FillJAndData
void FillJAndData(SparseMatrix &A) const
Fill the J and data arrays of the sparse matrix A.
Definition: lor_batched.cpp:229

mfem::FiniteElementCollection
Collection of finite elements from the same family in multiple dimensions. This class is used to matc...
Definition: fe_coll.hpp:26

mfem::BatchedLORAssembly::Assemble
void Assemble(BilinearForm &a, const Array< int > ess_dofs, OperatorHandle &A)
Assemble the given form as a matrix and place the result in A.
Definition: lor_batched.cpp:471

mfem::FiniteElement::GetDof
int GetDof() const
Returns the number of degrees of freedom in the finite element.
Definition: fe_base.hpp:323

mfem::Operator::Height
int Height() const
Get the height (size of output) of the Operator. Synonym with NumRows().
Definition: operator.hpp:66

mfem::SparseMatrix::WriteJ
int * WriteJ(bool on_dev=true)
Definition: sparsemat.hpp:257

mfem::Mesh::GetNE
int GetNE() const
Returns number of elements.
Definition: mesh.hpp:1086

a
double a
Definition: lissajous.cpp:41

mfem::BilinearForm
A "square matrix" operator for the associated FE space and BLFIntegrators The sum of all the BLFInteg...
Definition: bilinearform.hpp:60

mfem::FiniteElementSpace::GetQuadratureInterpolator
const QuadratureInterpolator * GetQuadratureInterpolator(const IntegrationRule &ir) const
Return a QuadratureInterpolator that interpolates E-vectors to quadrature point values and/or derivat...
Definition: fespace.cpp:1370

mfem::OperatorHandle::As
OpType * As() const
Return the Operator pointer statically cast to a specified OpType. Similar to the method Get()...
Definition: handle.hpp:104

mfem::Memory::New
void New(int size)
Allocate host memory for size entries with the current host memory type returned by MemoryManager::Ge...
Definition: mem_manager.hpp:888

mfem::ElementDofOrdering
ElementDofOrdering
Constants describing the possible orderings of the DOFs in one element.
Definition: fespace.hpp:74

dim
int dim
Definition: ex24.cpp:53

lor_batched.hpp

mfem::SparseMatrix::OverrideSize
void OverrideSize(int height_, int width_)
Sets the height and width of the matrix.
Definition: sparsemat.cpp:297

mfem::FiniteElementSpace::GetVSize
int GetVSize() const
Return the number of vector dofs, i.e. GetNDofs() x GetVDim().
Definition: fespace.hpp:709

mfem::ElementDofOrdering::LEXICOGRAPHIC
Lexicographic ordering for tensor-product FiniteElements.

mfem::ParBilinearForm
Class for parallel bilinear form.
Definition: pbilinearform.hpp:28

mfem::Array::Size
int Size() const
Return the logical size of the array.
Definition: array.hpp:141

mfem::BatchedLORAssembly::AssembleWithoutBC
void AssembleWithoutBC(BilinearForm &a, OperatorHandle &A)
Assemble the system without eliminating essential DOFs.
Definition: lor_batched.cpp:423

mfem::Vector
Vector data type.
Definition: vector.hpp:58

mfem::BatchedLORAssembly::BatchedLORAssembly
BatchedLORAssembly(FiniteElementSpace &fes_ho_)
Construct the batched assembly object corresponding to fes_ho_.
Definition: lor_batched.cpp:488

mfem::Mesh::GetNodes
void GetNodes(Vector &node_coord) const
Definition: mesh.cpp:8302

mfem::SparseMatrix::HostReadWriteI
int * HostReadWriteI()
Definition: sparsemat.hpp:249

mfem::QuadratureInterpolator::SetOutputLayout
void SetOutputLayout(QVectorLayout layout) const
Set the desired output Q-vector layout. The default value is QVectorLayout::byNODES.
Definition: quadinterpolator.hpp:92

mfem::ElementRestriction::Indices
const Array< int > & Indices() const
Definition: restriction.hpp:98

mfem::Operator
Abstract operator.
Definition: operator.hpp:24

mfem::HypreParMatrix
Wrapper for hypre&#39;s ParCSR matrix class.
Definition: hypre.hpp:343

mfem::Reshape
MFEM_HOST_DEVICE DeviceTensor< sizeof...(Dims), T > Reshape(T *ptr, Dims... dims)
Wrap a pointer as a DeviceTensor with automatically deduced template parameters.
Definition: dtensor.hpp:131

mfem::GetCollocatedIntRule
IntegrationRule GetCollocatedIntRule(FiniteElementSpace &fes)
Definition: lor_batched.cpp:494

mfem::SparseMatrix::EliminateBC
void EliminateBC(const Array< int > &ess_dofs, DiagonalPolicy diag_policy)
Eliminate essential (Dirichlet) boundary conditions.
Definition: sparsemat.cpp:2315

mfem::BatchedLORAssembly::SparseIJToCSR
void SparseIJToCSR(OperatorHandle &A) const
After assembling the "sparse IJ" format, convert it to CSR.
Definition: lor_batched.cpp:360

mfem::Mesh::EnsureNodes
void EnsureNodes()
Make sure that the mesh has valid nodes, i.e. its geometry is described by a vector finite element gr...
Definition: mesh.cpp:5583

mfem::OperatorHandle::Reset
void Reset(OpType *A, bool own_A=true)
Reset the OperatorHandle to the given OpType pointer, A.
Definition: handle.hpp:145

mfem::QVectorLayout::byVDIM
VDIM x NQPT x NE (values) / VDIM x DIM x NQPT x NE (grads)

mfem::Geometry::Type
Type
Definition: geom.hpp:35

mfem::SparseMatrix::WriteData
double * WriteData(bool on_dev=true)
Definition: sparsemat.hpp:273

mfem::BatchedLORAssembly::AssemblyKernel
void AssemblyKernel(BilinearForm &a)
Fill in sparse_ij and sparse_mapping using one of the specialized LOR assembly kernel classes...
Definition: lor_batched.cpp:384