#include "../../fem/quadinterpolator.hpp"
#include "../../general/forall.hpp"
#include "../pbilinearform.hpp"
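// Batched low-order-refined (LOR) assembly: the routines below build the LOR
// system matrix directly from the high-order space, storing the elementwise
// LOR matrices in the "sparse IJ" format (sparse_ij, sparse_mapping) and the
// LOR vertex coordinates in X_vert, before converting the result to CSR.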
// Return true if the domain integrators of the form 'a' consist of exactly
// one integrator of type T1 or T2, or one of each (in either order).
template <typename T1, typename T2>
bool HasIntegrators(BilinearForm &a)
{
   Array<BilinearFormIntegrator*> *integs = a.GetDBFI();
   if (integs == NULL) { return false; }
   if (integs->Size() == 1)
   {
      BilinearFormIntegrator *i0 = (*integs)[0];
      if (dynamic_cast<T1*>(i0) || dynamic_cast<T2*>(i0)) { return true; }
   }
   else if (integs->Size() == 2)
   {
      BilinearFormIntegrator *i0 = (*integs)[0];
      BilinearFormIntegrator *i1 = (*integs)[1];
      if ((dynamic_cast<T1*>(i0) && dynamic_cast<T2*>(i1)) ||
          (dynamic_cast<T2*>(i0) && dynamic_cast<T1*>(i1)))
      {
         return true;
      }
   }
   return false;
}
// FormIsSupported: H1, ND, and RT spaces with the matching integrator pairs.
bool BatchedLORAssembly::FormIsSupported(BilinearForm &a)
{
   const FiniteElementCollection *fec = a.FESpace()->FEColl();
   if (dynamic_cast<const H1_FECollection*>(fec))
   {
      if (HasIntegrators<DiffusionIntegrator, MassIntegrator>(a)) { return true; }
   }
   else if (dynamic_cast<const ND_FECollection*>(fec))
   {
      if (HasIntegrators<CurlCurlIntegrator, VectorFEMassIntegrator>(a)) { return true; }
   }
   else if (dynamic_cast<const RT_FECollection*>(fec))
   {
      if (HasIntegrators<DivDivIntegrator, VectorFEMassIntegrator>(a)) { return true; }
   }
   return false;
}
// FormLORVertexCoordinates: sample the high-order nodal grid function at the
// collocated points to obtain the LOR vertex coordinates in X_vert. (mesh_ho,
// dim, order, the nodal grid function and its element restriction, and
// quad_interp are set up in the omitted lines of this function.)
const int nel_ho = mesh_ho.GetNE();
const int nd1d = order + 1;
const int ndof_per_el = static_cast<int>(pow(nd1d, dim));

// Map the nodal L-vector to an E-vector...
nodal_restriction->Mult(*nodal_gf, nodal_evec);

// ...then interpolate the E-vector at the collocated quadrature points, which
// are exactly the LOR vertices.
X_vert.SetSize(dim*ndof_per_el*nel_ho);
quad_interp->Values(nodal_evec, X_vert);
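// Note on layout (an assumption based on the sizes above and the
// QuadratureInterpolator output layout): X_vert stores dim coordinates per
// LOR vertex, for ndof_per_el vertices per high-order element, for nel_ho
// elements, i.e. it can be viewed as
// Reshape(X_vert.Read(), dim, ndof_per_el, nel_ho).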
// Return the smallest element index that appears in both my_elts and
// nbr_elts (INT_MAX if the two lists do not intersect).
static MFEM_HOST_DEVICE int GetMinElt(const int *my_elts, const int n_my_elts,
                                      const int *nbr_elts, const int n_nbr_elts)
{
   int min_el = INT_MAX;
   for (int i = 0; i < n_my_elts; i++)
   {
      const int e_i = my_elts[i];
      if (e_i >= min_el) { continue; }
      for (int j = 0; j < n_nbr_elts; j++)
      {
         if (e_i == nbr_elts[j]) { min_el = e_i; break; }
      }
   }
   return min_el;
}
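// For example, with my_elts = {2, 5} and nbr_elts = {5, 9}, the only shared
// element is 5, so GetMinElt returns 5; the assembly kernels use this so that
// a matrix entry shared by several elements is handled by exactly one of them.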
// Return the current insertion index for row i_L and atomically increment its
// counter, so that concurrent threads write to distinct slots of the row.
static MFEM_HOST_DEVICE int GetAndIncrementNnzIndex(const int i_L, int *I)
{
   return AtomicAdd(I[i_L], 1);
}
int BatchedLORAssembly::FillI(SparseMatrix &A) const
{
   static constexpr int Max = 16; // largest number of elements sharing a DOF
   const int nvdof = fes_ho.GetVSize();
   const int ndof_per_el = fes_ho.GetFE(0)->GetDof();
   const int nel_ho = fes_ho.GetNE();
   const int nnz_per_row = sparse_mapping.Size()/ndof_per_el;

   const ElementRestriction *el_restr =
      dynamic_cast<const ElementRestriction*>(
         fes_ho.GetElementRestriction(ElementDofOrdering::LEXICOGRAPHIC));
   MFEM_VERIFY(el_restr != nullptr, "Bad element restriction");

   const Array<int> &el_dof_lex_ = el_restr->GatherMap();
   const Array<int> &dof_glob2loc_ = el_restr->Indices();
   const Array<int> &dof_glob2loc_offsets_ = el_restr->Offsets();

   const auto el_dof_lex = Reshape(el_dof_lex_.Read(), ndof_per_el, nel_ho);
   const auto dof_glob2loc = dof_glob2loc_.Read();
   const auto K = dof_glob2loc_offsets_.Read();
   const auto map = Reshape(sparse_mapping.Read(), nnz_per_row, ndof_per_el);

   auto I = A.WriteI();

   // First pass: count the nonzeros of each row of the assembled matrix.
   MFEM_FORALL(ii, nvdof + 1, I[ii] = 0;);
   MFEM_FORALL(i, ndof_per_el*nel_ho,
   {
      const int ii_el = i%ndof_per_el;
      const int iel_ho = i/ndof_per_el;
      // Signed L-DOF index of the current row (sign encodes orientation)
      const int sii = el_dof_lex(ii_el, iel_ho);
      const int ii = (sii >= 0) ? sii : -1 - sii;
      // Elements containing the row DOF
      int i_elts[Max];
      const int i_offset = K[ii];
      const int i_next_offset = K[ii+1];
      const int i_ne = i_next_offset - i_offset;
      for (int e_i = 0; e_i < i_ne; ++e_i)
      {
         const int si_E = dof_glob2loc[i_offset+e_i];
         const int i_E = (si_E >= 0) ? si_E : -1 - si_E;
         i_elts[e_i] = i_E/ndof_per_el;
      }
      for (int j = 0; j < nnz_per_row; ++j)
      {
         int jj_el = map(j, ii_el);
         if (jj_el < 0) { continue; }
         // Signed L-DOF index of the column
         const int sjj = el_dof_lex(jj_el, iel_ho);
         const int jj = (sjj >= 0) ? sjj : -1 - sjj;
         const int j_offset = K[jj];
         const int j_next_offset = K[jj+1];
         const int j_ne = j_next_offset - j_offset;
         if (i_ne == 1 || j_ne == 1)
         {
            // The entry (ii, jj) is seen by only one element: always count it.
            AtomicAdd(I[ii], 1);
         }
         else
         {
            // The entry is shared by several elements: count it only on the
            // smallest element index containing both DOFs.
            int j_elts[Max];
            for (int e_j = 0; e_j < j_ne; ++e_j)
            {
               const int sj_E = dof_glob2loc[j_offset+e_j];
               const int j_E = (sj_E >= 0) ? sj_E : -1 - sj_E;
               const int elt = j_E/ndof_per_el;
               j_elts[e_j] = elt;
            }
            const int min_e = GetMinElt(i_elts, i_ne, j_elts, j_ne);
            if (iel_ho == min_e) { AtomicAdd(I[ii], 1); }
         }
      }
   });
   // Second step: turn the per-row counts into CSR row offsets (a prefix sum)
   // and return the total number of nonzeros.
   auto h_I = A.HostReadWriteI();
   int sum_nnz = 0;
   for (int i = 0; i < nvdof; i++)
   {
      const int nnz = h_I[i];
      h_I[i] = sum_nnz;
      sum_nnz += nnz;
   }
   h_I[nvdof] = sum_nnz;
   return sum_nnz;
}
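// Note: the CSR matrix is built in two passes. FillI (above) only counts the
// nonzeros per row and converts the counts into row offsets; FillJAndData
// (below) revisits the same element data and writes the column indices and
// values into the slots reserved by FillI.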
void BatchedLORAssembly::FillJAndData(SparseMatrix &A) const
{
   const int nvdof = fes_ho.GetVSize();
   const int ndof_per_el = fes_ho.GetFE(0)->GetDof();
   const int nel_ho = fes_ho.GetNE();
   const int nnz_per_row = sparse_mapping.Size()/ndof_per_el;

   const ElementRestriction *el_restr =
      dynamic_cast<const ElementRestriction*>(
         fes_ho.GetElementRestriction(ElementDofOrdering::LEXICOGRAPHIC));
   MFEM_VERIFY(el_restr != nullptr, "Bad element restriction");

   const Array<int> &el_dof_lex_ = el_restr->GatherMap();
   const Array<int> &dof_glob2loc_ = el_restr->Indices();
   const Array<int> &dof_glob2loc_offsets_ = el_restr->Offsets();

   const auto el_dof_lex = Reshape(el_dof_lex_.Read(), ndof_per_el, nel_ho);
   const auto dof_glob2loc = dof_glob2loc_.Read();
   const auto K = dof_glob2loc_offsets_.Read();

   const auto V = Reshape(sparse_ij.Read(), nnz_per_row, ndof_per_el, nel_ho);
   const auto map = Reshape(sparse_mapping.Read(), nnz_per_row, ndof_per_el);

   Array<int> I_(nvdof + 1);
   const auto I = I_.Write();
   const auto J = A.WriteJ();
   auto AV = A.WriteData();

   // Copy A.I into the scratch array I, which is used as a per-row insertion
   // counter (see GetAndIncrementNnzIndex), so that A.I itself is preserved.
   const auto I2 = A.ReadI();
   MFEM_FORALL(i, nvdof + 1, I[i] = I2[i];);

   static constexpr int Max = 16;

   MFEM_FORALL(i, ndof_per_el*nel_ho,
   {
      const int ii_el = i%ndof_per_el;
      const int iel_ho = i/ndof_per_el;

      // Signed L-DOF index of the current row
      const int sii = el_dof_lex(ii_el, iel_ho);
      const int ii = (sii >= 0) ? sii : -1 - sii;

      // Elements containing the row DOF, and the corresponding element-local
      // indices (with the sign encoding the orientation)
      int i_elts[Max];
      int i_B[Max];
      const int i_offset = K[ii];
      const int i_next_offset = K[ii+1];
      const int i_ne = i_next_offset - i_offset;
      for (int e_i = 0; e_i < i_ne; ++e_i)
      {
         const int si_E = dof_glob2loc[i_offset+e_i];
         const bool plus = si_E >= 0;
         const int i_E = plus ? si_E : -1 - si_E;
         i_elts[e_i] = i_E/ndof_per_el;
         const int i_Bi = i_E % ndof_per_el;
         i_B[e_i] = plus ? i_Bi : -1 - i_Bi;
      }
      for (int j = 0; j < nnz_per_row; ++j)
      {
         int jj_el = map(j, ii_el);
         if (jj_el < 0) { continue; }
         // Signed L-DOF index of the column
         const int sjj = el_dof_lex(jj_el, iel_ho);
         const int jj = (sjj >= 0) ? sjj : -1 - sjj;
         const int sgn = ((sjj >= 0 && sii >= 0) || (sjj < 0 && sii < 0)) ? 1 : -1;
         const int j_offset = K[jj];
         const int j_next_offset = K[jj+1];
         const int j_ne = j_next_offset - j_offset;
         if (i_ne == 1 || j_ne == 1)
         {
            // The entry is seen by only one element: write it directly.
            const int nnz = GetAndIncrementNnzIndex(ii, I);
            J[nnz] = jj;
            AV[nnz] = sgn*V(j, ii_el, iel_ho);
         }
         else
         {
            // The entry is shared: sum the contributions from all elements
            // containing both DOFs, but only on the element with the smallest
            // index (so the entry is written exactly once).
            int j_elts[Max];
            int j_B[Max];
            for (int e_j = 0; e_j < j_ne; ++e_j)
            {
               const int sj_E = dof_glob2loc[j_offset+e_j];
               const bool plus = sj_E >= 0;
               const int j_E = plus ? sj_E : -1 - sj_E;
               j_elts[e_j] = j_E/ndof_per_el;
               const int j_Bj = j_E % ndof_per_el;
               j_B[e_j] = plus ? j_Bj : -1 - j_Bj;
            }
            const int min_e = GetMinElt(i_elts, i_ne, j_elts, j_ne);
            if (iel_ho == min_e)
            {
               double val = 0.0;
               for (int k = 0; k < i_ne; k++)
               {
                  const int iel_ho_2 = i_elts[k];
                  const int sii_el_2 = i_B[k];
                  const int ii_el_2 = (sii_el_2 >= 0) ? sii_el_2 : -1 - sii_el_2;
                  for (int l = 0; l < j_ne; l++)
                  {
                     const int jel_ho_2 = j_elts[l];
                     if (iel_ho_2 == jel_ho_2)
                     {
                        const int sjj_el_2 = j_B[l];
                        const int jj_el_2 = (sjj_el_2 >= 0) ? sjj_el_2 : -1 - sjj_el_2;
                        const int sgn_2 = ((sjj_el_2 >= 0 && sii_el_2 >= 0)
                                           || (sjj_el_2 < 0 && sii_el_2 < 0)) ? 1 : -1;
                        // Find the column jj_el_2 in element iel_ho_2's row
                        int j2 = -1;
                        for (int m = 0; m < nnz_per_row; ++m)
                        {
                           if (map(m, ii_el_2) == jj_el_2) { j2 = m; break; }
                        }
                        MFEM_ASSERT_KERNEL(j2 >= 0, "Can't find nonzero");
                        val += sgn_2*V(j2, ii_el_2, iel_ho_2);
                     }
                  }
               }
               const int nnz = GetAndIncrementNnzIndex(ii, I);
               J[nnz] = jj;
               AV[nnz] = val;
            }
         }
      }
   });
}
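// Note: the sign factors (sgn, sgn_2) account for DOFs whose element-local
// orientation is flipped, which the gather map encodes with negative indices.
// This matters for the ND and RT spaces; for H1 all signs are +1.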
// In SparseIJToCSR: count the nonzeros and set up the row offsets of A_mat.
int nnz = FillI(*A_mat);
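// The remaining steps of SparseIJToCSR presumably allocate the J and data
// arrays once nnz is known and then fill them, along the lines of the sketch
// below (based on the SparseMatrix memory API, not verbatim from this file):
//    A_mat->GetMemoryJ().New(nnz, GetDeviceMemoryType());
//    A_mat->GetMemoryData().New(nnz, GetDeviceMemoryType());
//    FillJAndData(*A_mat);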
// AssemblyKernel: instantiate the LOR kernel class for this form and dispatch
// to the compile-time specialization matching the mesh dimension and order.
template <typename LOR_KERNEL>
void BatchedLORAssembly::AssemblyKernel(BilinearForm &a)
{
   LOR_KERNEL kernel(a, fes_ho, X_vert, sparse_ij, sparse_mapping);

   const int dim = fes_ho.GetMesh()->Dimension();
   const int order = fes_ho.GetMaxElementOrder();

   if (dim == 2)
   {
      switch (order)
      {
         case 1: kernel.template Assemble2D<1>(); break;
         case 2: kernel.template Assemble2D<2>(); break;
         case 3: kernel.template Assemble2D<3>(); break;
         case 4: kernel.template Assemble2D<4>(); break;
         case 5: kernel.template Assemble2D<5>(); break;
         case 6: kernel.template Assemble2D<6>(); break;
         case 7: kernel.template Assemble2D<7>(); break;
         case 8: kernel.template Assemble2D<8>(); break;
         default: MFEM_ABORT("No kernel order " << order << "!");
      }
   }
   else if (dim == 3)
   {
      switch (order)
      {
         case 1: kernel.template Assemble3D<1>(); break;
         case 2: kernel.template Assemble3D<2>(); break;
         case 3: kernel.template Assemble3D<3>(); break;
         case 4: kernel.template Assemble3D<4>(); break;
         case 5: kernel.template Assemble3D<5>(); break;
         case 6: kernel.template Assemble3D<6>(); break;
         case 7: kernel.template Assemble3D<7>(); break;
         case 8: kernel.template Assemble3D<8>(); break;
         default: MFEM_ABORT("No kernel order " << order << "!");
      }
   }
}
// In AssembleWithoutBC: dispatch to the kernel matching the space and integrators.
const FiniteElementCollection *fec = fes_ho.FEColl();
if (dynamic_cast<const H1_FECollection*>(fec))
{
   if (HasIntegrators<DiffusionIntegrator, MassIntegrator>(a))
   {
      AssemblyKernel<BatchedLOR_H1>(a);
   }
}
else if (dynamic_cast<const ND_FECollection*>(fec))
{
   if (HasIntegrators<CurlCurlIntegrator, VectorFEMassIntegrator>(a))
   {
      AssemblyKernel<BatchedLOR_ND>(a);
   }
}
else if (dynamic_cast<const RT_FECollection*>(fec))
{
   if (HasIntegrators<DivDivIntegrator, VectorFEMassIntegrator>(a))
   {
      AssemblyKernel<BatchedLOR_RT>(a);
   }
}
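// Note: the branches above mirror FormIsSupported; if the form matches none
// of them, no assembly kernel is invoked here.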
// The parallel path (ParAssemble) eliminates essential DOFs from the parallel
// matrix with diagonal policy DIAG_ONE:
                        Operator::DiagonalPolicy::DIAG_ONE);

// Assemble dispatches to ParAssemble when the high-order space is parallel:
if (dynamic_cast<ParFiniteElementSpace*>(&fes_ho))

// The serial path eliminates essential DOFs with diagonal policy DIAG_KEEP:
                        Operator::DiagonalPolicy::DIAG_KEEP);

// In GetCollocatedIntRule:
return irs.Get(geom, 2*nd1d - 3);
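// Note: assuming irs uses Gauss-Lobatto points in 1D (which is what
// collocation with the LOR vertices requires), a rule of order 2*n - 3 has
// exactly n points per direction, so requesting order 2*nd1d - 3 yields
// nd1d = order + 1 points that coincide with the LOR vertices.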