// html/hybridization__ext_8cpp_source.html

// Copyright (c) 2010-2025, Lawrence Livermore National Security, LLC. Produced

// at the Lawrence Livermore National Laboratory. All Rights reserved. See files

// LICENSE and NOTICE for details. LLNL-CODE-806117.

//

// This file is part of the MFEM library. For more information and source code

// availability visit https://mfem.org.

//

// MFEM is free software; you can redistribute it and/or modify it under the

// terms of the BSD-3 license. We welcome feedback and contributions, see file

// CONTRIBUTING.md for details.


#include "hybridization_ext.hpp"

#include "hybridization.hpp"

#include "pfespace.hpp"

#include "../general/forall.hpp"

#include "../linalg/batched/batched.hpp"

#include "../linalg/kernels.hpp"


namespace mfem

{


/// Construct the extension for the given Hybridization object; the member
/// @a h is initialized from @a hybridization_ and no other work is done here.
HybridizationExtension::HybridizationExtension(Hybridization &hybridization_)
   : h(hybridization_) { }


/// Return the number of faces of element 0 of @a mesh: its number of edges
/// when the mesh is 2D and its number of faces when the mesh is 3D. Any other
/// mesh dimension aborts with "Invalid dimension.".
static int GetNFacesPerElement(const Mesh &mesh)
{
   const int mesh_dim = mesh.Dimension();
   // In 2D the "faces" of an element are its edges.
   if (mesh_dim == 2) { return mesh.GetElement(0)->GetNEdges(); }
   if (mesh_dim == 3) { return mesh.GetElement(0)->GetNFaces(); }
   MFEM_ABORT("Invalid dimension.");
}


void HybridizationExtension::ConstructC()

{

   Mesh &mesh = *h.fes.GetMesh();

   const int ne = mesh.GetNE();

   const int nf = mesh.GetNFbyType(FaceType::Interior);

   const int m = h.fes.GetFE(0)->GetDof(); // num hat dofs per el

   const int n = h.c_fes.GetFaceElement(0)->GetDof(); // num c dofs per face

   const int n_faces_per_el = GetNFacesPerElement(mesh);


   // Assemble Ct_mat using EA

   Vector emat(m * n * 2 * nf);

   h.c_bfi->AssembleEAInteriorFaces(h.c_fes, h.fes, emat, false);


   const auto *tbe = dynamic_cast<const TensorBasisElement*>(h.fes.GetFE(0));

   MFEM_VERIFY(tbe, "");

   // Note: copying the DOF map here (instead of using a reference) because

   // reading it on GPU can cause issues in other parts of the code when using

   // the debug device. The DOF map is accessed in other places without

   // explicitly calling HostRead, which fails on non-const access if the device

   // pointer is valid.

   Array<int> dof_map = tbe->GetDofMap();


   Ct_mat.SetSize(m * n * n_faces_per_el * ne);

   const auto d_emat = Reshape(emat.Read(), m, n, 2, nf);

   const int *d_dof_map = dof_map.Read();

   const auto d_face_to_el = Reshape(face_to_el.Read(), 2, 2, nf);

   auto d_Ct_mat = Reshape(Ct_mat.Write(), m, n, n_faces_per_el, ne);


   mfem::forall(Ct_mat.Size(), [=] MFEM_HOST_DEVICE (int i)

   {

      d_Ct_mat[i] = 0.0;

   });


   mfem::forall(m*n*2*nf, [=] MFEM_HOST_DEVICE (int idx)

   {

      const int i_lex = idx % m;

      const int j = (idx / m) % n;

      const int ie = (idx / m / n) % 2;

      const int f = idx / m / n / 2;


      const int e  = d_face_to_el(0, ie, f);

      const int fi = d_face_to_el(1, ie, f);


      // Skip elements belonging to face neighbors of shared faces

      if (e < ne)

      {

         // Convert to back to native MFEM ordering in the volume

         const int i_s = d_dof_map[i_lex];

         const int i = (i_s >= 0) ? i_s : -1 - i_s;

         d_Ct_mat(i, j, fi, e) = d_emat(i_lex, j, ie, f);

      }

   });

}


namespace internal
{

/// Fixed-capacity array of SIZE elements of type T that converts implicitly
/// to a (mutable) pointer to its first element, callable from host and device
/// code.
template <typename T, int SIZE>
struct LocalMemory
{
   T data[SIZE];

   /// Pointer to the first element. The conversion is const-qualified but
   /// deliberately yields a non-const pointer.
   MFEM_HOST_DEVICE inline operator T *() const
   {
      return const_cast<T*>(&data[0]);
   }
};

/// Zero-capacity specialization: holds no storage and converts to a null
/// pointer.
template <typename T>
struct LocalMemory<T,0>
{
   MFEM_HOST_DEVICE inline operator T *() const
   {
      return static_cast<T*>(nullptr);
   }
};

} // namespace internal


/// Split every element matrix in Ahat into interior/boundary blocks, factor
/// the blocks, and compute @a AhatInvCt_mat.
///
/// @tparam MID  Compile-time upper bound on the number of interior DOFs per
///              element (size of idofs).
/// @tparam MBD  Compile-time upper bound on the number of boundary DOFs per
///              element (size of bdofs).
///
/// When MID and MBD are both zero (GLOBAL mode) the blocks and pivots are
/// factored in place in the member arrays Ahat_ii, Ahat_ib, Ahat_bi, Ahat_bb,
/// Ahat_ii_piv and Ahat_bb_piv. Otherwise the work is done in per-element
/// local arrays of the given sizes and copied out to the member arrays at the
/// end.
///
/// @param[out] AhatInvCt_mat  Resized to Ct_mat.Size() and indexed as
///                            (hat dof, constraint dof, local face, element).
///                            For each column of Ct_mat, the rows of the free
///                            boundary DOFs receive the result of the LU solve
///                            with the factored boundary block; rows of
///                            interior and essential DOFs are set to zero.
template <int MID, int MBD>
void HybridizationExtension::FactorElementMatrices(Vector &AhatInvCt_mat)
{
   const Mesh &mesh = *h.fes.GetMesh();
   const int ne = mesh.GetNE();
   const int n_faces_per_el = GetNFacesPerElement(mesh);
   const int m = h.fes.GetFE(0)->GetDof();
   const int n = h.c_fes.GetFaceElement(0)->GetDof();

   AhatInvCt_mat.SetSize(Ct_mat.Size());
   auto d_AhatInvCt = Reshape(AhatInvCt_mat.Write(), m, n, n_faces_per_el, ne);

   {
      const int nidofs = idofs.Size();
      const int nbdofs = bdofs.Size();

      // NOTE(review): for the <0,0> instantiation these checks pass only when
      // both DOF lists are empty, yet ConstructH dispatches to <0,0> exactly
      // when the sizes exceed the tabulated limits. As written the GLOBAL path
      // therefore looks unreachable -- confirm the intended bound for it.
      MFEM_VERIFY(nidofs <= MID, "");
      MFEM_VERIFY(nbdofs <= MBD, "");

      Ahat_ii.SetSize(nidofs*nidofs*ne);
      Ahat_ib.SetSize(nidofs*nbdofs*ne);
      Ahat_bi.SetSize(nbdofs*nidofs*ne);
      Ahat_bb.SetSize(nbdofs*nbdofs*ne);

      Ahat_ii_piv.SetSize(nidofs*ne);
      Ahat_bb_piv.SetSize(nbdofs*ne);

      const auto *d_idofs = idofs.Read();
      const auto *d_bdofs = bdofs.Read();

      const auto d_hat_dof_marker = Reshape(hat_dof_marker.Read(), m, ne);
      auto d_Ahat = Reshape(Ahat.Read(), m, m, ne);

      auto d_A_ii = Reshape(Ahat_ii.Write(), nidofs, nidofs, ne);
      auto d_A_ib_all = Reshape(Ahat_ib.Write(), nidofs*nbdofs, ne);
      auto d_A_bi_all = Reshape(Ahat_bi.Write(), nbdofs*nidofs, ne);
      auto d_A_bb_all = Reshape(Ahat_bb.Write(), nbdofs*nbdofs, ne);

      auto d_ipiv_ii = Reshape(Ahat_ii_piv.Write(), nidofs, ne);
      auto d_ipiv_bb = Reshape(Ahat_bb_piv.Write(), nbdofs, ne);

      const auto d_Ct_mat = Reshape(Ct_mat.Read(), m, n, n_faces_per_el, ne);

      // GLOBAL: no compile-time sizes were given, so the blocks are factored
      // directly in the member arrays instead of in local storage.
      static constexpr bool GLOBAL = (MID == 0 && MBD == 0);

      using internal::LocalMemory;

      mfem::forall(ne, [=] MFEM_HOST_DEVICE (int e)
      {
         constexpr int MD1D = DofQuadLimits::HDIV_MAX_D1D;
         constexpr int MAX_DOFS = 3*MD1D*(MD1D-1)*(MD1D-1);
         constexpr int MAX_IDOFS = (MID == 0 && MBD == 0) ? MAX_DOFS : MID;
         constexpr int MAX_BDOFS = (MID == 0 && MBD == 0) ? MAX_DOFS : MBD;

         // Local copies of the interior and boundary DOF index lists.
         LocalMemory<int,MAX_IDOFS> idofs_loc;
         LocalMemory<int,MAX_BDOFS> bdofs_loc;
         for (int i = 0; i < nidofs; i++) { idofs_loc[i] = d_idofs[i]; }
         for (int i = 0; i < nbdofs; i++) { bdofs_loc[i] = d_bdofs[i]; }

         // Split the boundary DOFs of this element into essential ones
         // (essdofs_loc) and free ones. The free ones are compacted in place
         // to the front of bdofs_loc; nbfdofs counts them.
         LocalMemory<int,MAX_BDOFS> essdofs_loc;
         int nbfdofs = 0;
         int nessdofs = 0;
         for (int i = 0; i < nbdofs; i++)
         {
            const int dof_idx = bdofs_loc[i];
            if (d_hat_dof_marker(dof_idx, e) == ESSENTIAL)
            {
               essdofs_loc[nessdofs] = dof_idx;
               nessdofs += 1;
            }
            else
            {
               bdofs_loc[nbfdofs] = dof_idx;
               nbfdofs += 1;
            }
         }

         LocalMemory<real_t, MID*MID> A_ii_loc;
         LocalMemory<real_t, MBD*MID> A_bi_loc;
         LocalMemory<real_t, MID*MBD> A_ib_loc;
         LocalMemory<real_t, MBD*MBD> A_bb_loc;

         DeviceMatrix A_ii(GLOBAL ? &d_A_ii(0,0,e) : A_ii_loc, nidofs, nidofs);
         DeviceMatrix A_ib(GLOBAL ? &d_A_ib_all(0,e) : A_ib_loc, nidofs, nbfdofs);
         DeviceMatrix A_bi(GLOBAL ? &d_A_bi_all(0,e) : A_bi_loc, nbfdofs, nidofs);
         DeviceMatrix A_bb(GLOBAL ? &d_A_bb_all(0,e) : A_bb_loc, nbfdofs, nbfdofs);

         // Gather the four blocks of the element matrix.
         for (int j = 0; j < nidofs; j++)
         {
            const int jj = idofs_loc[j];
            for (int i = 0; i < nidofs; i++)
            {
               A_ii(i,j) = d_Ahat(idofs_loc[i], jj, e);
            }
            for (int i = 0; i < nbfdofs; i++)
            {
               A_bi(i,j) = d_Ahat(bdofs_loc[i], jj, e);
            }
         }
         for (int j = 0; j < nbfdofs; j++)
         {
            const int jj = bdofs_loc[j];
            for (int i = 0; i < nidofs; i++)
            {
               A_ib(i,j) = d_Ahat(idofs_loc[i], jj, e);
            }
            for (int i = 0; i < nbfdofs; i++)
            {
               A_bb(i,j) = d_Ahat(bdofs_loc[i], jj, e);
            }
         }

         LocalMemory<int,MID> ipiv_ii_loc;
         LocalMemory<int,MBD> ipiv_bb_loc;

         // Each block needs its own pivot storage. In GLOBAL mode the pivots
         // of A_bb must go to d_ipiv_bb: aliasing d_ipiv_ii here would let the
         // factorization of A_bb overwrite the pivots of A_ii and would leave
         // Ahat_bb_piv unwritten.
         auto ipiv_ii = GLOBAL ? &d_ipiv_ii(0,e) : ipiv_ii_loc;
         auto ipiv_bb = GLOBAL ? &d_ipiv_bb(0,e) : ipiv_bb_loc;

         kernels::LUFactor(A_ii, nidofs, ipiv_ii);
         kernels::BlockFactor(A_ii, nidofs, ipiv_ii, nbfdofs, A_ib, A_bi, A_bb);
         kernels::LUFactor(A_bb, nbfdofs, ipiv_bb);

         // For every (face, constraint dof) column of Ct: solve with the
         // factored boundary block on the free boundary rows, and zero the
         // interior and essential rows.
         for (int f = 0; f < n_faces_per_el; ++f)
         {
            for (int j = 0; j < n; ++j)
            {
               LocalMemory<real_t,MAX_BDOFS> Sb_inv_Cb_t;
               for (int i = 0; i < nbfdofs; ++i)
               {
                  Sb_inv_Cb_t[i] = d_Ct_mat(bdofs_loc[i], j, f, e);
               }
               kernels::LUSolve(A_bb, nbfdofs, ipiv_bb, Sb_inv_Cb_t);
               for (int i = 0; i < nbfdofs; ++i)
               {
                  const int b_i = bdofs_loc[i];
                  d_AhatInvCt(b_i, j, f, e) = Sb_inv_Cb_t[i];
               }
               for (int i = 0; i < nidofs; ++i)
               {
                  d_AhatInvCt(idofs_loc[i], j, f, e) = 0.0;
               }
               for (int i = 0; i < nessdofs; ++i)
               {
                  d_AhatInvCt(essdofs_loc[i], j, f, e) = 0.0;
               }
            }
         }

         // Write out to global memory
         if (!GLOBAL)
         {
            // Note: in the following constructors, avoid using index 0 in
            //       d_A_{bi,ib,bb}_all when their size is 0.
            DeviceMatrix d_A_bi((nbfdofs && nidofs) ?
                                &d_A_bi_all(0,e) : nullptr,
                                nbfdofs, nidofs);
            DeviceMatrix d_A_ib((nbfdofs && nidofs) ?
                                &d_A_ib_all(0,e) : nullptr,
                                nidofs, nbfdofs);
            DeviceMatrix d_A_bb((nbfdofs) ? &d_A_bb_all(0,e) : nullptr,
                                nbfdofs, nbfdofs);

            for (int j = 0; j < nidofs; j++)
            {
               d_ipiv_ii(j,e) = ipiv_ii[j];
               for (int i = 0; i < nidofs; i++)
               {
                  d_A_ii(i,j,e) = A_ii(i,j);
               }
               for (int i = 0; i < nbfdofs; i++)
               {
                  d_A_bi(i,j) = A_bi(i,j);
               }
            }
            for (int j = 0; j < nbfdofs; j++)
            {
               d_ipiv_bb(j,e) = ipiv_bb[j];
               for (int i = 0; i < nidofs; i++)
               {
                  d_A_ib(i,j) = A_ib(i,j);
               }
               for (int i = 0; i < nbfdofs; i++)
               {
                  d_A_bb(i,j) = A_bb(i,j);
               }
            }
         }
      });
   }
}


/// Assemble the hybridized system matrix into h.H (or h.pH in parallel).
///
/// Steps, in order:
///  1. Factor the element matrices and obtain AhatInvCt_mat from
///     FactorElementMatrices, dispatching on the sizes of idofs and bdofs.
///  2. Build face_to_face: for every interior face, the list of distinct
///     faces of its (local) adjacent elements, padded with -1.
///  3. For every (face, connected face) pair, accumulate the n-by-n block
///     Ct_i^T * AhatInvCt_j over the elements the two faces share.
///  4. Convert the blocks to a CSR SparseMatrix, keeping only nonzero
///     entries; rows with no entries get a single 1 on the diagonal.
///  5. With MPI and a parallel constraint space, form h.pH as P^T H P and
///     release h.H.
void HybridizationExtension::ConstructH()
{
   const Mesh &mesh = *h.fes.GetMesh();
   const int ne = mesh.GetNE();
   const int n_faces_per_el = GetNFacesPerElement(mesh);
   const int m = h.fes.GetFE(0)->GetDof();
   const int n = h.c_fes.GetFaceElement(0)->GetDof();

   Vector AhatInvCt_mat;

   {
      // The dispatch below is based on the following sizes, sorted
      // appropriately.
      //
      // RT(k) in 2D (quads): (interior,boundary) dofs:
      // - arbitrary k: 2*(k+1)*(k+2)-4*(k+1), 4*(k+1)
      // - k=0: (0,4)
      // - k=1: (4,8)
      // - k=2: (12,12)
      // - k=3: (24,16)
      // RT(k) in 3D (hexes): (interior,boundary) dofs:
      // - arbitrary k: 3*(k+1)^2*(k+2)-6*(k+1)^2, 6*(k+1)^2
      // - k=0: (0,6)
      // - k=1: (12,24)
      // - k=2: (54,54)
      const int NI = idofs.Size();
      const int NB = bdofs.Size();
      if (NI == 0 && NB <= 4) { FactorElementMatrices<0,4>(AhatInvCt_mat); }
      else if (NI == 0 && NB <= 6) { FactorElementMatrices<0,6>(AhatInvCt_mat); }
      else if (NI <= 4 && NB <= 8) { FactorElementMatrices<4,8>(AhatInvCt_mat); }
      else if (NI <= 12 && NB <= 12) { FactorElementMatrices<12,12>(AhatInvCt_mat); }
      else if (NI <= 12 && NB <= 24) { FactorElementMatrices<12,24>(AhatInvCt_mat); }
      else if (NI <= 24 && NB <= 16) { FactorElementMatrices<24,16>(AhatInvCt_mat); }
      else if (NI <= 54 && NB <= 54) { FactorElementMatrices<54,54>(AhatInvCt_mat); }
      // Fallback
      else { FactorElementMatrices<0,0>(AhatInvCt_mat); }
   }

   const auto d_AhatInvCt =
      Reshape(AhatInvCt_mat.Read(), m, n, n_faces_per_el, ne);

   const int nf = h.fes.GetNFbyType(FaceType::Interior);
   // A face has at most two adjacent elements with n_faces_per_el faces each,
   // and the face itself is counted once: 2*n_faces_per_el - 1 connections.
   const int n_face_connections = 2*n_faces_per_el - 1;
   Array<int> face_to_face(nf * n_face_connections);

   // Dense n-by-n block for every (face, connection slot) pair.
   Array<real_t> CAhatInvCt(nf*n_face_connections*n*n);

   const auto d_Ct = Reshape(Ct_mat.Read(), m, n, n_faces_per_el, ne);
   const auto d_face_to_el = Reshape(face_to_el.Read(), 2, 2, nf);
   const auto d_el_to_face = Reshape(el_to_face.Read(), n_faces_per_el, ne);
   auto d_CAhatInvCt = Reshape(CAhatInvCt.Write(), n, n, n_face_connections, nf);
   auto d_face_to_face = Reshape(face_to_face.Write(), n_face_connections, nf);

   // The blocks are accumulated into below, so start from zero.
   mfem::forall(n*n*n_face_connections*nf, [=] MFEM_HOST_DEVICE (int i)
   {
      d_CAhatInvCt[i] = 0.0;
   });

   // Build the face-to-face connectivity, one interior face per iteration.
   mfem::forall(nf, [=] MFEM_HOST_DEVICE (int fi)
   {
      int idx = 0;
      for (int ei = 0; ei < 2; ++ei)
      {
         const int e = d_face_to_el(0, ei, fi);
         // Only elements with a valid local index contribute.
         if (e < 0 || e >= ne) { continue; }
         for (int fj_i = 0; fj_i < n_faces_per_el; ++fj_i)
         {
            const int fj = d_el_to_face(fj_i, e);
            // Explicitly allow fi == fj (self-connections)
            if (fj < 0) { continue; }

            // Have we seen this face before? It is possible in some
            // configurations to encounter the same neighboring face twice
            int idx_j = idx;
            for (int i = 0; i < idx; ++i)
            {
               if (d_face_to_face(i, fi) == fj)
               {
                  idx_j = i;
                  break;
               }
            }
            // This is a new face, record it and increment the counter
            if (idx_j == idx)
            {
               d_face_to_face(idx, fi) = fj;
               idx++;
            }
         }
      }
      // Fill unused entries with -1 to indicate invalid
      for (; idx < n_face_connections; ++idx)
      {
         d_face_to_face(idx, fi) = -1;
      }
   });

   // Compute the block for every valid (fi, fj) connection.
   mfem::forall(nf*n_face_connections, [=] MFEM_HOST_DEVICE (int idx)
   {
      const int idx_j = idx % n_face_connections;
      const int fi = idx / n_face_connections;

      const int fj = d_face_to_face(idx_j, fi);
      if (fj < 0) { return; }

      for (int ei = 0; ei < 2; ++ei)
      {
         const int e = d_face_to_el(0, ei, fi);
         if (e < 0 || e >= ne) { continue; }
         const int fi_i = d_face_to_el(1, ei, fi);

         // Find the local index of face fj within element e; it stays -1 if
         // fj is not a face of e.
         int fj_i = -1;
         for (int ej = 0; ej < 2; ++ej)
         {
            if (d_face_to_el(0, ej, fj) == e)
            {
               fj_i = d_face_to_el(1, ej, fj);
               break;
            }
         }
         if (fj_i >= 0)
         {
            const real_t *Ct_i = &d_Ct(0, 0, fi_i, e);
            const real_t *AhatInvCt_i = &d_AhatInvCt(0, 0, fj_i, e);
            real_t *CAhatInvCt_i = &d_CAhatInvCt(0, 0, idx_j, fi);
            kernels::AddMultAtB(m, n, n, Ct_i, AhatInvCt_i, CAhatInvCt_i);
         }
      }
   });

   const int ncdofs = h.c_fes.GetVSize();
   const ElementDofOrdering ordering = ElementDofOrdering::NATIVE;
   const FaceRestriction *face_restr =
      h.c_fes.GetFaceRestriction(ordering, FaceType::Interior);
   // Maps (local face dof, face) to an index used below as a row/column of H.
   const auto c_gather_map = Reshape(face_restr->GatherMap().Read(), n, nf);

   h.H.reset(new SparseMatrix);
   h.H->OverrideSize(ncdofs, ncdofs);

   h.H->GetMemoryI().New(ncdofs + 1, h.H->GetMemoryI().GetMemoryType());

   // First pass: count the nonzeros of every row into I.
   {
      int *I = h.H->WriteI();

      mfem::forall(ncdofs, [=] MFEM_HOST_DEVICE (int i) { I[i] = 0; });

      mfem::forall(nf*n, [=] MFEM_HOST_DEVICE (int idx_i)
      {
         const int i = idx_i % n;
         const int fi = idx_i / n;
         const int ii = c_gather_map(i, fi);

         for (int idx = 0; idx < n_face_connections; ++idx)
         {
            const int fj = d_face_to_face(idx, fi);
            // Valid connections are stored first, so -1 ends the list.
            if (fj < 0) { break; }
            for (int j = 0; j < n; ++j)
            {
               if (d_CAhatInvCt(i, j, idx, fi) != 0)
               {
                  I[ii]++;
               }
            }
         }
      });
   }

   // At this point, I[i] contains the number of nonzeros in row I. Perform a
   // partial sum to get I in CSR format. This is serial, so perform on host.
   //
   // At the same time, we find any empty rows and add a single nonzero (we will
   // put 1 on the diagonal) and record the row index.
   Array<int> empty_rows;
   {
      int *I = h.H->HostReadWriteI();
      int empty_row_count = 0;
      for (int i = 0; i < ncdofs; i++)
      {
         if (I[i] == 0) { empty_row_count++; }
      }
      empty_rows.SetSize(empty_row_count);

      int empty_row_idx = 0;
      int sum = 0;
      for (int i = 0; i < ncdofs; i++)
      {
         int nnz = I[i];
         if (nnz == 0)
         {
            empty_rows[empty_row_idx] = i;
            empty_row_idx++;
            nnz = 1;
         }
         I[i] = sum;
         sum += nnz;
      }
      I[ncdofs] = sum;
   }

   const int nnz = h.H->HostReadI()[ncdofs];
   h.H->GetMemoryJ().New(nnz, h.H->GetMemoryJ().GetMemoryType());
   h.H->GetMemoryData().New(nnz, h.H->GetMemoryData().GetMemoryType());

   // Second pass: fill J and the values. I[ii] is used as the insertion
   // cursor of row ii and is advanced on every insertion, so after this block
   // I[ii] holds the end of row ii rather than its start.
   {
      int *I = h.H->ReadWriteI();
      int *J = h.H->WriteJ();
      real_t *V = h.H->WriteData();

      mfem::forall(nf*n, [=] MFEM_HOST_DEVICE (int idx_i)
      {
         const int i = idx_i % n;
         const int fi = idx_i / n;
         const int ii = c_gather_map[i + fi*n];
         for (int idx = 0; idx < n_face_connections; ++idx)
         {
            const int fj = d_face_to_face(idx, fi);
            if (fj < 0) { break; }
            for (int j = 0; j < n; ++j)
            {
               const real_t val = d_CAhatInvCt(i, j, idx, fi);
               if (val != 0)
               {
                  const int k = I[ii];
                  const int jj = c_gather_map(j, fj);
                  I[ii]++;
                  J[k] = jj;
                  V[k] = val;
               }
            }
         }
      });

      // Rows that received no entries get a single 1 on the diagonal.
      const int *d_empty_rows = empty_rows.Read();
      mfem::forall(empty_rows.Size(), [=] MFEM_HOST_DEVICE (int idx)
      {
         const int i = d_empty_rows[idx];
         const int k = I[i];
         I[i]++;
         J[k] = i;
         V[k] = 1.0;
      });
   }

   // Shift back down (serial, done on host)
   {
      int *I = h.H->HostReadWriteI();
      for (int i = ncdofs - 1; i > 0; --i)
      {
         I[i] = I[i-1];
      }
      I[0] = 0;
   }

#ifdef MFEM_USE_MPI
   auto *c_pfes = dynamic_cast<ParFiniteElementSpace*>(&h.c_fes);
   if (c_pfes)
   {
      // Wrap H as a block-diagonal parallel matrix and form P^T H P with the
      // dof-to-true-dof matrix P of the constraint space; h.H is released
      // afterwards.
      OperatorHandle pP(h.pH.Type()), dH(h.pH.Type());
      pP.ConvertFrom(c_pfes->Dof_TrueDof_Matrix());
      dH.MakeSquareBlockDiag(c_pfes->GetComm(),c_pfes->GlobalVSize(),
                             c_pfes->GetDofOffsets(), h.H.get());
      h.pH.MakePtAP(dH, pP);
      h.H.reset();
   }
#endif
}


void HybridizationExtension::MultCt(const Vector &x, Vector &y) const

{

   Mesh &mesh = *h.fes.GetMesh();

   const int ne = mesh.GetNE();

   const int nf = mesh.GetNFbyType(FaceType::Interior);


   const int n_hat_dof_per_el = h.fes.GetFE(0)->GetDof();

   const int n_c_dof_per_face = h.c_fes.GetFaceElement(0)->GetDof();

   const int n_faces_per_el = GetNFacesPerElement(mesh);


   const ElementDofOrdering ordering = ElementDofOrdering::NATIVE;

   const FaceRestriction *face_restr =

      h.c_fes.GetFaceRestriction(ordering, FaceType::Interior);


   Vector x_evec(face_restr->Height());

   face_restr->Mult(x, x_evec);


   const int *d_el_to_face = el_to_face.Read();

   const auto d_Ct = Reshape(Ct_mat.Read(), n_hat_dof_per_el, n_c_dof_per_face,

                             n_faces_per_el, ne);

   const auto d_x_evec = Reshape(x_evec.Read(), n_c_dof_per_face, nf);

   auto d_y = Reshape(y.Write(), n_hat_dof_per_el, ne);


   mfem::forall(ne * n_hat_dof_per_el, [=] MFEM_HOST_DEVICE (int idx)

   {

      const int e = idx / n_hat_dof_per_el;

      const int i = idx % n_hat_dof_per_el;

      d_y(i, e) = 0.0;

      for (int fi = 0; fi < n_faces_per_el; ++fi)

      {

         const int f = d_el_to_face[e*n_faces_per_el + fi];

         if (f < 0) { continue; }

         for (int j = 0; j < n_c_dof_per_face; ++j)

         {

            d_y(i, e) += d_Ct(i, j, fi, e)*d_x_evec(j, f);

         }

      }

   });

}


void HybridizationExtension::MultC(const Vector &x, Vector &y) const

{

   Mesh &mesh = *h.fes.GetMesh();

   const int ne = mesh.GetNE();

   const int nf = mesh.GetNFbyType(FaceType::Interior);


   const int n_hat_dof_per_el = h.fes.GetFE(0)->GetDof();

   const int n_c_dof_per_face = h.c_fes.GetFaceElement(0)->GetDof();

   const int n_faces_per_el = GetNFacesPerElement(mesh);


   const ElementDofOrdering ordering = ElementDofOrdering::NATIVE;

   const FaceRestriction *face_restr = h.c_fes.GetFaceRestriction(

                                          ordering, FaceType::Interior);


   Vector y_evec(face_restr->Height());

   const auto d_face_to_el = Reshape(face_to_el.Read(), 2, 2, nf);

   const auto d_Ct = Reshape(Ct_mat.Read(), n_hat_dof_per_el, n_c_dof_per_face,

                             n_faces_per_el, ne);

   auto d_x = Reshape(x.Read(), n_hat_dof_per_el, ne);

   auto d_y_evec = Reshape(y_evec.Write(), n_c_dof_per_face, nf);


   mfem::forall(nf * n_c_dof_per_face, [=] MFEM_HOST_DEVICE (int idx)

   {

      const int f = idx / n_c_dof_per_face;

      const int j = idx % n_c_dof_per_face;

      d_y_evec(j, f) = 0.0;

      for (int el_i = 0; el_i < 2; ++el_i)

      {

         const int e = d_face_to_el(0, el_i, f);

         const int fi = d_face_to_el(1, el_i, f);


         // Skip face neighbor elements of shared faces

         if (e >= ne) { continue; }


         for (int i = 0; i < n_hat_dof_per_el; ++i)

         {

            d_y_evec(j, f) += d_Ct(i, j, fi, e)*d_x(i, e);

         }

      }

   });


   y.SetSize(face_restr->Width());

   face_restr->MultTranspose(y_evec, y);

}


void HybridizationExtension::AssembleMatrix(int el, const DenseMatrix &elmat)

{

   const int n = elmat.Width();

   const real_t *d_elmat = elmat.Read();

   real_t *d_Ahat = Ahat.ReadWrite();

   const int offset = el*n*n;

   mfem::forall(n*n, [=] MFEM_HOST_DEVICE (int i)

   {

      d_Ahat[offset + i] += d_elmat[i];

   });

}


void HybridizationExtension::AssembleBdrMatrix(int bdr_el,

                                               const DenseMatrix &elmat)

{

   DenseMatrix B = elmat; // deep copy

   const int n = h.fes.GetFE(0)->GetDof();

   // Create mapping e2f from element DOF indices to face DOF indices

   Array<int> e2f(n);

   e2f = -1;

   int el;

   {

      Mesh &mesh = *h.fes.GetMesh();

      int info;

      mesh.GetBdrElementAdjacentElement(bdr_el, el, info);

      Array<int> lvdofs;

      lvdofs.Reserve(elmat.Height());

      h.fes.FEColl()->SubDofOrder(mesh.GetElementGeometry(el),

                                  mesh.Dimension() - 1, info, lvdofs);

      // Convert local element dofs to local element vdofs.

      const int vdim = h.fes.GetVDim();

      Ordering::DofsToVDofs<Ordering::byNODES>(n/vdim, vdim, lvdofs);

      MFEM_ASSERT(lvdofs.Size() == elmat.Height(), "internal error");


      B.AdjustDofDirection(lvdofs);

      FiniteElementSpace::AdjustVDofs(lvdofs);

      // Create a map from local element vdofs to local boundary (face) vdofs.

      for (int i = 0; i < lvdofs.Size(); i++)

      {

         e2f[lvdofs[i]] = i;

      }

   }


   const int offset = el*n*n;

   Ahat.HostReadWrite();

   for (int j = 0; j < n; ++j)

   {

      const int j_f = e2f[j];

      if (j_f < 0) { continue; }

      for (int i = 0; i < n; ++i)

      {

         const int i_f = e2f[i];

         if (i_f < 0) { continue; }

         Ahat[offset + i + j*n] += B(i_f, j_f);

      }

   }

}


void HybridizationExtension::AssembleElementMatrices(const DenseTensor &elmats)

{

   const real_t *d_elmats = elmats.Read();

   real_t *d_Ahat = Ahat.ReadWrite();

   mfem::forall(elmats.TotalSize(), [=] MFEM_HOST_DEVICE (int i)

   {

      d_Ahat[i] += d_elmats[i];

   });

}


/// Set up the data structures used by the extension.
///
/// In order: verifies the preconditions (fixed order, 2D or 3D, conforming
/// mesh, tensor basis); splits the element-local DOFs into idofs and bdofs;
/// builds the el_to_face and face_to_el tables for interior faces; sets the
/// hat offsets and allocates a zeroed Ahat; calls ConstructC(); classifies
/// every hat DOF in hat_dof_marker; and builds hat_dof_gather_map.
///
/// @param[in] ess_tdof_list  Indices of the essential true DOFs of h.fes.
void HybridizationExtension::Init(const Array<int> &ess_tdof_list)
{
   // Verify that preconditions for the extension are met
   const Mesh &mesh = *h.fes.GetMesh();
   const int dim = mesh.Dimension();
   const int ne = h.fes.GetNE();
   const int ndof_per_el = h.fes.GetFE(0)->GetDof();
   const int ndof_per_face = h.c_fes.GetFaceElement(0)->GetDof();

   MFEM_VERIFY(!h.fes.IsVariableOrder(), "");
   MFEM_VERIFY(dim == 2 || dim == 3, "");
   MFEM_VERIFY(mesh.Conforming(), "");
   MFEM_VERIFY(UsesTensorBasis(h.fes), "");

   // Set up array for idofs and bdofs
   {
      const TensorBasisElement* tbe =
         dynamic_cast<const TensorBasisElement*>(h.fes.GetFE(0));
      MFEM_VERIFY(tbe != nullptr, "");
      const Array<int> &dof_map = tbe->GetDofMap();

      const int n_faces_per_el = GetNFacesPerElement(mesh);

      // Collect the face maps of all local faces of element 0.
      Array<int> all_face_dofs;
      for (int f = 0; f < n_faces_per_el; ++f)
      {
         Array<int> face_map(ndof_per_face);
         h.fes.GetFE(0)->GetFaceMap(f, face_map);
         all_face_dofs.Append(face_map);
      }

      // Mark every DOF that appears in some face map. Negative entries s in
      // either map encode the index -1 - s.
      Array<bool> b_marker(ndof_per_el);
      b_marker = false;
      for (int i = 0; i < all_face_dofs.Size(); ++i)
      {
         const int j_s = all_face_dofs[i];
         const int j = (j_s >= 0) ? j_s : -1 - j_s;
         const int j_nat_s = dof_map[j];
         const int j_nat = (j_nat_s >= 0) ? j_nat_s : -1 - j_nat_s;
         b_marker[j_nat] = true;
      }

      // Marked DOFs are boundary DOFs, all others are interior DOFs.
      for (int i = 0; i < ndof_per_el; ++i)
      {
         if (b_marker[i]) { bdofs.Append(i); }
         else { idofs.Append(i); }
      }
   }

   // Set up face info arrays
   const int n_faces_per_el = GetNFacesPerElement(mesh);
   el_to_face.SetSize(ne * n_faces_per_el);
   face_to_el.SetSize(4 * mesh.GetNFbyType(FaceType::Interior));
   el_to_face = -1;

   {
      // face_idx numbers the interior faces in the order they are visited.
      int face_idx = 0;
      for (int f = 0; f < mesh.GetNumFaces(); ++f)
      {
         const Mesh::FaceInformation info = mesh.GetFaceInformation(f);
         if (!info.IsInterior()) { continue; }

         const int el1 = info.element[0].index;
         const int fi1 = info.element[0].local_face_id;
         el_to_face[el1 * n_faces_per_el + fi1] = face_idx;

         const int el2 = info.element[1].index;
         const int fi2 = info.element[1].local_face_id;
         // For shared faces the second element is not a local element, so it
         // has no row in el_to_face.
         if (!info.IsShared())
         {
            el_to_face[el2 * n_faces_per_el + fi2] = face_idx;
         }

         // Four entries per face: (element, local face id) for each side.
         // The second element of a shared face is stored offset by ne, so
         // that it can be recognized by index >= ne.
         face_to_el[0 + 4*face_idx] = el1;
         face_to_el[1 + 4*face_idx] = fi1;
         face_to_el[2 + 4*face_idx] = info.IsShared() ? ne + el2 : el2;
         face_to_el[3 + 4*face_idx] = fi2;

         ++face_idx;
      }
   }

   // Count the number of dofs in the discontinuous version of fes:
   num_hat_dofs = ne*ndof_per_el;
   {
      h.hat_offsets.SetSize(ne + 1);
      int *d_hat_offsets = h.hat_offsets.Write();
      mfem::forall(ne + 1, [=] MFEM_HOST_DEVICE (int i)
      {
         d_hat_offsets[i] = i*ndof_per_el;
      });
   }

   // One ndof_per_el x ndof_per_el block per element, initially zero.
   Ahat.SetSize(ne*ndof_per_el*ndof_per_el);
   Ahat.UseDevice(true);
   Ahat = 0.0;

   ConstructC();

   const ElementDofOrdering ordering = ElementDofOrdering::NATIVE;
   const Operator *R_op = h.fes.GetElementRestriction(ordering);
   const auto *R = dynamic_cast<const ElementRestriction*>(R_op);
   MFEM_VERIFY(R, "");

   // Find out which "hat DOFs" are essential (depend only on essential Lagrange
   // multiplier DOFs).
   {
      const int ntdofs = h.fes.GetTrueVSize();
      // free_tdof_marker is 1 if the DOF is free, 0 if the DOF is essential
      Array<int> free_tdof_marker(ntdofs);
      {
         int *d_free_tdof_marker = free_tdof_marker.Write();
         mfem::forall(ntdofs, [=] MFEM_HOST_DEVICE (int i)
         {
            d_free_tdof_marker[i] = 1;
         });
         const int n_ess_dofs = ess_tdof_list.Size();
         const int *d_ess_tdof_list = ess_tdof_list.Read();
         mfem::forall(n_ess_dofs, [=] MFEM_HOST_DEVICE (int i)
         {
            d_free_tdof_marker[d_ess_tdof_list[i]] = 0;
         });
      }

      // Marker on the vdofs: obtained from the true-DOF marker through the
      // boolean product with P in parallel, otherwise the same array.
      Array<int> free_vdofs_marker;
#ifdef MFEM_USE_MPI
      auto *pfes = dynamic_cast<ParFiniteElementSpace*>(&h.fes);
      if (pfes)
      {
         HypreParMatrix *P = pfes->Dof_TrueDof_Matrix();
         free_vdofs_marker.SetSize(h.fes.GetVSize());
         // TODO: would be nice to do this on device
         P->BooleanMult(1, free_tdof_marker.HostRead(),
                        0, free_vdofs_marker.HostWrite());
      }
      else
      {
         free_vdofs_marker.MakeRef(free_tdof_marker);
      }
#else
      free_vdofs_marker.MakeRef(free_tdof_marker);
#endif

      hat_dof_marker.SetSize(num_hat_dofs);
      {
         // The gather map from the ElementRestriction operator gives us the
         // index of the L-dof corresponding to a given (element, local DOF)
         // index pair.
         const int *gather_map = R->GatherMap().Read();
         const int *d_free_vdofs_marker = free_vdofs_marker.Read();
         const auto d_Ct_mat = Reshape(Ct_mat.Read(), ndof_per_el,
                                       ndof_per_face, n_faces_per_el, ne);
         DofType *d_hat_dof_marker = hat_dof_marker.Write();

         // Classify every hat DOF in a single pass. A DOF whose L-dof is not
         // free is marked ESSENTIAL. A free DOF is marked BOUNDARY if its row
         // of Ct_mat has a nonzero entry for some face of its element, and
         // INTERIOR otherwise.
         mfem::forall(num_hat_dofs, [=] MFEM_HOST_DEVICE (int i)
         {
            const int j_s = gather_map[i];
            const int j = (j_s >= 0) ? j_s : -1 - j_s;
            if (d_free_vdofs_marker[j])
            {
               const int i_loc = i % ndof_per_el;
               const int e = i / ndof_per_el;
               d_hat_dof_marker[i] = INTERIOR;
               for (int f = 0; f < n_faces_per_el; ++f)
               {
                  for (int k = 0; k < ndof_per_face; ++k)
                  {
                     if (d_Ct_mat(i_loc, k, f, e) != 0.0)
                     {
                        d_hat_dof_marker[i] = BOUNDARY;
                        // Leaves only the loop over k; the remaining faces
                        // are still scanned, which does not change the result.
                        break;
                     }
                  }
               }
            }
            else
            {
               d_hat_dof_marker[i] = ESSENTIAL;
            }
         });
      }
   }

   // Create the hat DOF gather map. This is used to apply the action of R and
   // R^T
   {
      const int vsize = h.fes.GetVSize();
      hat_dof_gather_map.SetSize(num_hat_dofs);
      const int *d_offsets = R->Offsets().Read();
      const int *d_indices = R->Indices().Read();
      int *d_hat_dof_gather_map = hat_dof_gather_map.Write();
      // Default: -1 (invalid) for hat DOFs that are not selected below.
      mfem::forall(num_hat_dofs, [=] MFEM_HOST_DEVICE (int i)
      {
         d_hat_dof_gather_map[i] = -1;
      });
      // For every vdof i, only the first entry of its index list is used; the
      // hat DOF it names is mapped back to i.
      mfem::forall(vsize, [=] MFEM_HOST_DEVICE (int i)
      {
         const int offset = d_offsets[i];
         const int j_s = d_indices[offset];
         const int hat_dof_index = (j_s >= 0) ? j_s : -1 - j_s;
         // Note: -1 is used as a special value (invalid), so the negative
         // DOF indices start at -2.
         d_hat_dof_gather_map[hat_dof_index] = (j_s >= 0) ? i : (-2 - i);
      });
   }
}


void HybridizationExtension::MultR(const Vector &x_hat, Vector &x) const

{

   const Operator *R = h.fes.GetRestrictionOperator();


   // If R is null, then L-vector and T-vector are the same, and we don't need

   // an intermediate temporary variable.

   //

   // If R is not null, we first convert to intermediate L-vector (with the

   // correct BCs), and then from L-vector to T-vector.

   if (!R)

   {

      MFEM_ASSERT(x.Size() == h.fes.GetVSize(), "");

      tmp2.MakeRef(x, 0);

   }

   else

   {

      tmp2.SetSize(R->Width());

      R->MultTranspose(x, tmp2);

   }


   const ElementDofOrdering ordering = ElementDofOrdering::NATIVE;

   const auto *restr = static_cast<const ElementRestriction*>(

                          h.fes.GetElementRestriction(ordering));

   const int *gather_map = restr->GatherMap().Read();

   const DofType *d_hat_dof_marker = hat_dof_marker.Read();

   const real_t *d_evec = x_hat.Read();

   real_t *d_lvec = tmp2.ReadWrite();

   mfem::forall(num_hat_dofs, [=] MFEM_HOST_DEVICE (int i)

   {

      // Skip essential DOFs

      if (d_hat_dof_marker[i] == ESSENTIAL) { return; }


      const int j_s = gather_map[i];

      const int sgn = (j_s >= 0) ? 1 : -1;

      const int j = (j_s >= 0) ? j_s : -1 - j_s;


      d_lvec[j] = sgn*d_evec[i];

   });


   // Convert from L-vector to T-vector.

   if (R) { R->Mult(tmp2, x); }

}


void HybridizationExtension::MultRt(const Vector &b, Vector &b_hat) const

{

   Vector b_lvec;

   const Operator *R = h.fes.GetRestrictionOperator();

   if (!R)

   {

      b_lvec.MakeRef(const_cast<Vector&>(b), 0, b.Size());

   }

   else

   {

      tmp1.SetSize(h.fes.GetVSize());

      b_lvec.MakeRef(tmp1, 0, tmp1.Size());

      R->MultTranspose(b, b_lvec);

   }


   b_hat.SetSize(num_hat_dofs);

   const int *d_hat_dof_gather_map = hat_dof_gather_map.Read();

   const real_t *d_b_lvec = b_lvec.Read();

   real_t *d_b_hat = b_hat.Write();

   mfem::forall(num_hat_dofs, [=] MFEM_HOST_DEVICE (int i)

   {

      const int j_s = d_hat_dof_gather_map[i];

      if (j_s == -1) // invalid

      {

         d_b_hat[i] = 0.0;

      }

      else

      {

         const int sgn = (j_s >= 0) ? 1 : -1;

         const int j = (j_s >= 0) ? j_s : -2 - j_s;

         d_b_hat[i] = sgn*d_b_lvec[j];

      }

   });

}


// Apply the element-wise A_hat^{-1} to x, in place.
//
// For every element, the local values are split into the "interior" DOFs
// (idofs) and the non-essential "boundary" DOFs (bdofs), and a block
// forward substitution / Schur complement solve / block backward substitution
// is performed using the stored blocks Ahat_ii, Ahat_ib, Ahat_bi, Ahat_bb and
// their pivots. Entries of x at essential boundary DOFs are not modified.
void HybridizationExtension::MultAhatInv(Vector &x) const
{
   const int num_el = h.fes.GetMesh()->GetNE();
   const int dofs_per_el = h.fes.GetFE(0)->GetDof();

   const int nidofs = idofs.Size();
   const int nbdofs = bdofs.Size();
   const bool has_interior = (nidofs > 0);

   // Element-wise views of the DOF markers, matrix blocks and pivots.
   const auto marker = Reshape(hat_dof_marker.Read(), dofs_per_el, num_el);

   const auto A_ii = Reshape(Ahat_ii.Read(), nidofs, nidofs, num_el);
   const auto A_ib = Reshape(Ahat_ib.Read(), nidofs*nbdofs, num_el);
   const auto A_bi = Reshape(Ahat_bi.Read(), nbdofs*nidofs, num_el);
   const auto A_bb = Reshape(Ahat_bb.Read(), nbdofs*nbdofs, num_el);

   const auto piv_ii = Reshape(Ahat_ii_piv.Read(), nidofs, num_el);
   const auto piv_bb = Reshape(Ahat_bb_piv.Read(), nbdofs, num_el);

   const auto *interior_list = idofs.Read();
   const auto *boundary_list = bdofs.Read();

   // Work vectors holding the gathered interior / boundary values per element.
   Vector ivals(nidofs*num_el);
   Vector bvals(nbdofs*num_el);
   auto iv = Reshape(ivals.Write(), nidofs, num_el);
   auto bv = Reshape(bvals.Write(), nbdofs, num_el);

   auto xe = Reshape(x.ReadWrite(), dofs_per_el, num_el);

   mfem::forall(num_el, [=] MFEM_HOST_DEVICE (int e)
   {
      constexpr int MD1D = DofQuadLimits::HDIV_MAX_D1D;
      constexpr int MAX_DOFS = 3*MD1D*(MD1D-1)*(MD1D-1);
      internal::LocalMemory<int,MAX_DOFS> free_bdofs;

      // Collect the boundary DOFs of this element that are not essential.
      int n_free_b = 0;
      for (int k = 0; k < nbdofs; ++k)
      {
         const int dof = boundary_list[k];
         if (marker(dof, e) == ESSENTIAL) { continue; }
         free_bdofs[n_free_b++] = dof;
      }

      // Gather the local right-hand side.
      for (int k = 0; k < nidofs; ++k)
      {
         iv(k, e) = xe(interior_list[k], e);
      }
      for (int k = 0; k < n_free_b; ++k)
      {
         bv(k, e) = xe(free_bdofs[k], e);
      }

      if (has_interior)
      {
         // Block forward substitution:
         //    B1 <- L^{-1} P B1
         kernels::LSolve(&A_ii(0,0,e), nidofs, &piv_ii(0,e), &iv(0,e));
         //    B2 <- B2 - L21 B1
         kernels::SubMult(
            nidofs, n_free_b, 1, &A_bi(0,e), &iv(0,e), &bv(0,e));
      }

      // Solve with the factored Schur complement block.
      kernels::LUSolve(&A_bb(0,e), n_free_b, &piv_bb(0,e), &bv(0,e));

      if (has_interior)
      {
         // Block backward substitution:
         //    Y1 <- Y1 - U12 X2
         kernels::SubMult(
            n_free_b, nidofs, 1, &A_ib(0,e), &bv(0,e), &iv(0,e));
         //    Y1 <- U^{-1} Y1
         kernels::USolve(&A_ii(0,0,e), nidofs, &iv(0,e));
      }

      // Scatter the solution back into x.
      for (int k = 0; k < nidofs; ++k)
      {
         xe(interior_list[k], e) = iv(k, e);
      }
      for (int k = 0; k < n_free_b; ++k)
      {
         xe(free_bdofs[k], e) = bv(k, e);
      }
   });
}


void HybridizationExtension::ReduceRHS(const Vector &b, Vector &b_r) const

{

   Vector b_hat(num_hat_dofs);

   MultRt(b, b_hat);

   {

      const auto *d_hat_dof_marker = hat_dof_marker.Read();

      auto *d_b_hat = b_hat.ReadWrite();

      mfem::forall(num_hat_dofs, [=] MFEM_HOST_DEVICE (int i)

      {

         if (d_hat_dof_marker[i] == ESSENTIAL) { d_b_hat[i] = 0.0; }

      });

   }

   MultAhatInv(b_hat);

   const Operator *P = h.c_fes.GetProlongationMatrix();

   if (P)

   {

      Vector bl(P->Height());

      b_r.SetSize(P->Width());

      MultC(b_hat, bl);

      P->MultTranspose(bl, b_r);

   }

   else

   {

      MultC(b_hat, b_r);

   }

}


void HybridizationExtension::ComputeSolution(

   const Vector &b, const Vector &sol_r, Vector &sol) const

{

   // tmp1 = A_hat^{-1} ( R^T b - C^T lambda )

   Vector b_hat(num_hat_dofs);

   MultRt(b, b_hat);


   tmp1.SetSize(num_hat_dofs);

   const Operator *P = h.c_fes.GetProlongationMatrix();

   if (P)

   {

      Vector sol_l(P->Height());

      P->Mult(sol_r, sol_l);

      MultCt(sol_l, tmp1);

   }

   else

   {

      MultCt(sol_r, tmp1);

   }

   add(b_hat, -1.0, tmp1, tmp1);

   // Eliminate essential DOFs

   const auto *d_hat_dof_marker = hat_dof_marker.Read();

   real_t *d_tmp1 = tmp1.ReadWrite();

   mfem::forall(num_hat_dofs, [=] MFEM_HOST_DEVICE (int i)

   {

      if (d_hat_dof_marker[i] == ESSENTIAL) { d_tmp1[i] = 0.0; }

   });

   MultAhatInv(tmp1);

   MultR(tmp1, sol);

}


}

batched.hpp

mfem::Array
Definition array.hpp:48

mfem::Array::HostRead
const T * HostRead() const
Shortcut for mfem::Read(a.GetMemory(), a.Size(), false).
Definition array.hpp:385

mfem::Array::Reserve
void Reserve(int capacity)
Ensures that the allocated size is at least the given size.
Definition array.hpp:184

mfem::Array::SetSize
void SetSize(int nsize)
Change the logical size of the array, keep existing entries.
Definition array.hpp:840

mfem::Array::Size
int Size() const
Return the logical size of the array.
Definition array.hpp:166

mfem::Array::MakeRef
void MakeRef(T *data_, int size_, bool own_data=false)
Make this Array a reference to a pointer.
Definition array.hpp:1053

mfem::Array::Write
T * Write(bool on_dev=true)
Shortcut for mfem::Write(a.GetMemory(), a.Size(), on_dev).
Definition array.hpp:389

mfem::Array::Append
int Append(const T &el)
Append element 'el' to array, resize if necessary.
Definition array.hpp:912

mfem::Array::Read
const T * Read(bool on_dev=true) const
Shortcut for mfem::Read(a.GetMemory(), a.Size(), on_dev).
Definition array.hpp:381

mfem::Array::HostWrite
T * HostWrite()
Shortcut for mfem::Write(a.GetMemory(), a.Size(), false).
Definition array.hpp:393

mfem::DenseMatrix
Data type dense matrix using column-major storage.
Definition densemat.hpp:24

mfem::DenseMatrix::AdjustDofDirection
void AdjustDofDirection(Array< int > &dofs)
Definition densemat.cpp:2132

mfem::DenseMatrix::Read
const real_t * Read(bool on_dev=true) const
Shortcut for mfem::Read( GetMemory(), TotalSize(), on_dev).
Definition densemat.hpp:486

mfem::DenseTensor
Rank 3 tensor (array of matrices)
Definition densemat.hpp:1111

mfem::DenseTensor::TotalSize
int TotalSize() const
Definition densemat.hpp:1132

mfem::DenseTensor::Read
const real_t * Read(bool on_dev=true) const
Shortcut for mfem::Read( GetMemory(), TotalSize(), on_dev).
Definition densemat.hpp:1242

mfem::DeviceTensor
A basic generic Tensor class, appropriate for use on the GPU.
Definition dtensor.hpp:84

mfem::ElementRestriction
Operator that converts FiniteElementSpace L-vectors to E-vectors.
Definition restriction.hpp:41

mfem::ElementRestriction::GatherMap
const Array< int > & GatherMap() const
Definition restriction.hpp:104

mfem::Element::GetNFaces
virtual MFEM_DEPRECATED int GetNFaces(int &nFaceVertices) const =0

mfem::Element::GetNEdges
virtual int GetNEdges() const =0

mfem::FaceRestriction
Base class for operators that extracts Face degrees of freedom.
Definition restriction.hpp:167

mfem::FaceRestriction::MultTranspose
void MultTranspose(const Vector &x, Vector &y) const override
Set the face degrees of freedom in the element degrees of freedom y to the values given in x.
Definition restriction.hpp:232

mfem::FaceRestriction::GatherMap
virtual const Array< int > & GatherMap() const
Low-level access to the underlying gather map.
Definition restriction.hpp:284

mfem::FaceRestriction::Mult
void Mult(const Vector &x, Vector &y) const override=0
Extract the face degrees of freedom from x into y.

mfem::FiniteElementCollection::SubDofOrder
void SubDofOrder(Geometry::Type Geom, int SDim, int Info, Array< int > &dofs) const
Get the local dofs for a given sub-manifold.
Definition fe_coll.cpp:533

mfem::FiniteElementSpace::IsVariableOrder
bool IsVariableOrder() const
Returns true if the space contains elements of varying polynomial orders.
Definition fespace.hpp:678

mfem::FiniteElementSpace::GetTrueVSize
virtual int GetTrueVSize() const
Return the number of vector true (conforming) dofs.
Definition fespace.hpp:829

mfem::FiniteElementSpace::AdjustVDofs
static void AdjustVDofs(Array< int > &vdofs)
Remove the orientation information encoded into an array of dofs Some basis function types have a rel...
Definition fespace.cpp:282

mfem::FiniteElementSpace::GetProlongationMatrix
virtual const Operator * GetProlongationMatrix() const
Definition fespace.hpp:696

mfem::FiniteElementSpace::GetRestrictionOperator
virtual const Operator * GetRestrictionOperator() const
An abstract operator that performs the same action as GetRestrictionMatrix.
Definition fespace.hpp:715

mfem::FiniteElementSpace::GetFE
virtual const FiniteElement * GetFE(int i) const
Returns pointer to the FiniteElement in the FiniteElementCollection associated with i'th element in t...
Definition fespace.cpp:3824

mfem::FiniteElementSpace::GetNE
int GetNE() const
Returns number of elements in the mesh.
Definition fespace.hpp:869

mfem::FiniteElementSpace::GetElementRestriction
const ElementRestrictionOperator * GetElementRestriction(ElementDofOrdering e_ordering) const
Return an Operator that converts L-vectors to E-vectors.
Definition fespace.cpp:1480

mfem::FiniteElementSpace::GetFaceElement
const FiniteElement * GetFaceElement(int i) const
Returns pointer to the FiniteElement in the FiniteElementCollection associated with i'th face in the ...
Definition fespace.cpp:3903

mfem::FiniteElementSpace::GetNFbyType
int GetNFbyType(FaceType type) const
Returns the number of faces according to the requested type.
Definition fespace.hpp:886

mfem::FiniteElementSpace::FEColl
const FiniteElementCollection * FEColl() const
Definition fespace.hpp:856

mfem::FiniteElementSpace::GetMesh
Mesh * GetMesh() const
Returns the mesh.
Definition fespace.hpp:644

mfem::FiniteElementSpace::GetVSize
int GetVSize() const
Return the number of vector dofs, i.e. GetNDofs() x GetVDim().
Definition fespace.hpp:826

mfem::FiniteElementSpace::GetVDim
int GetVDim() const
Returns the vector dimension of the finite element space.
Definition fespace.hpp:819

mfem::FiniteElementSpace::GetFaceRestriction
virtual const FaceRestriction * GetFaceRestriction(ElementDofOrdering f_ordering, FaceType, L2FaceValues mul=L2FaceValues::DoubleValued) const
Return an Operator that converts L-vectors to E-vectors on each face.
Definition fespace.cpp:1513

mfem::FiniteElement::GetFaceMap
virtual void GetFaceMap(const int face_id, Array< int > &face_map) const
Return the mapping from lexicographic face DOFs to lexicographic element DOFs for the given local fac...
Definition fe_base.cpp:517

mfem::FiniteElement::GetDof
int GetDof() const
Returns the number of degrees of freedom in the finite element.
Definition fe_base.hpp:337

mfem::HybridizationExtension::Ahat_ii_piv
Array< int > Ahat_ii_piv
Definition hybridization_ext.hpp:55

mfem::HybridizationExtension::Ct_mat
Vector Ct_mat
Constraint matrix (transposed) stored element-wise.
Definition hybridization_ext.hpp:50

mfem::HybridizationExtension::ConstructC
void ConstructC()
Construct the constraint matrix.
Definition hybridization_ext.cpp:37

mfem::HybridizationExtension::Init
void Init(const Array< int > &ess_tdof_list)
Prepare for assembly; form the constraint matrix.
Definition hybridization_ext.cpp:718

mfem::HybridizationExtension::Ahat_ii
Vector Ahat_ii
Definition hybridization_ext.hpp:54

mfem::HybridizationExtension::face_to_el
Array< int > face_to_el
Definition hybridization_ext.hpp:49

mfem::HybridizationExtension::Ahat
Vector Ahat
Definition hybridization_ext.hpp:54

mfem::HybridizationExtension::Ahat_bb
Vector Ahat_bb
Definition hybridization_ext.hpp:54

mfem::HybridizationExtension::FactorElementMatrices
void FactorElementMatrices(Vector &AhatInvCt_mat)
Definition hybridization_ext.cpp:108

mfem::HybridizationExtension::ReduceRHS
void ReduceRHS(const Vector &b, Vector &b_r) const
Given a right-hand side on the original space, compute the corresponding right-hand side for the Lagr...
Definition hybridization_ext.cpp:1095

mfem::HybridizationExtension::el_to_face
Array< int > el_to_face
Definition hybridization_ext.hpp:48

mfem::HybridizationExtension::hat_dof_gather_map
Array< int > hat_dof_gather_map
Definition hybridization_ext.hpp:45

mfem::HybridizationExtension::ComputeSolution
void ComputeSolution(const Vector &b, const Vector &sol_r, Vector &sol) const
Given Lagrange multipliers sol_r and the original right-hand side b, recover the solution sol on the ...
Definition hybridization_ext.cpp:1122

mfem::HybridizationExtension::Ahat_bb_piv
Array< int > Ahat_bb_piv
Definition hybridization_ext.hpp:55

mfem::HybridizationExtension::bdofs
Array< int > bdofs
Definition hybridization_ext.hpp:52

mfem::HybridizationExtension::DofType
DofType
Definition hybridization_ext.hpp:35

mfem::HybridizationExtension::BOUNDARY
@ BOUNDARY
Definition hybridization_ext.hpp:37

mfem::HybridizationExtension::ESSENTIAL
@ ESSENTIAL
Definition hybridization_ext.hpp:36

mfem::HybridizationExtension::INTERIOR
@ INTERIOR
Definition hybridization_ext.hpp:38

mfem::HybridizationExtension::hat_dof_marker
Array< DofType > hat_dof_marker
Definition hybridization_ext.hpp:46

mfem::HybridizationExtension::HybridizationExtension
HybridizationExtension(class Hybridization &hybridization_)
Constructor.
Definition hybridization_ext.cpp:22

mfem::HybridizationExtension::tmp1
Vector tmp1
Definition hybridization_ext.hpp:43

mfem::HybridizationExtension::tmp2
Vector tmp2
Temporary vectors.
Definition hybridization_ext.hpp:43

mfem::HybridizationExtension::ConstructH
void ConstructH()
Form the Schur complement matrix H.
Definition hybridization_ext.cpp:298

mfem::HybridizationExtension::MultR
void MultR(const Vector &b, Vector &b_hat) const
Apply the action of R mapping from "hat DOFs" to T-vector.
Definition hybridization_ext.cpp:929

mfem::HybridizationExtension::Ahat_bi
Vector Ahat_bi
Definition hybridization_ext.hpp:54

mfem::HybridizationExtension::MultC
void MultC(const Vector &x, Vector &y) const
Compute the action of C x.
Definition hybridization_ext.cpp:605

mfem::HybridizationExtension::MultAhatInv
void MultAhatInv(Vector &x) const
Apply the elementwise A_hat^{-1}.
Definition hybridization_ext.cpp:1007

mfem::HybridizationExtension::idofs
Array< int > idofs
Definition hybridization_ext.hpp:52

mfem::HybridizationExtension::num_hat_dofs
int num_hat_dofs
Number of "hat DOFs" (the size of the hat DOF vectors and markers).
Definition hybridization_ext.hpp:42

mfem::HybridizationExtension::AssembleMatrix
void AssembleMatrix(int el, const class DenseMatrix &elmat)
Assemble the element matrix A into the hybridized system matrix.
Definition hybridization_ext.cpp:650

mfem::HybridizationExtension::MultCt
void MultCt(const Vector &x, Vector &y) const
Compute the action of C^t x.
Definition hybridization_ext.cpp:565

mfem::HybridizationExtension::h
class Hybridization & h
The associated Hybridization object.
Definition hybridization_ext.hpp:41

mfem::HybridizationExtension::Ahat_ib
Vector Ahat_ib
Definition hybridization_ext.hpp:54

mfem::HybridizationExtension::MultRt
void MultRt(const Vector &b, Vector &b_hat) const
Apply the action of R^t mapping into the "hat DOF" space.
Definition hybridization_ext.cpp:972

mfem::HybridizationExtension::AssembleBdrMatrix
void AssembleBdrMatrix(int bdr_el, const class DenseMatrix &elmat)
Assemble the boundary element matrix A into the hybridized system matrix.
Definition hybridization_ext.cpp:662

mfem::HybridizationExtension::AssembleElementMatrices
void AssembleElementMatrices(const class DenseTensor &el_mats)
Invert and store the element matrices Ahat.
Definition hybridization_ext.cpp:708

mfem::Hybridization
Auxiliary class Hybridization, used to implement BilinearForm hybridization.
Definition hybridization.hpp:63

mfem::Hybridization::hat_offsets
Array< int > hat_offsets
Definition hybridization.hpp:84

mfem::Hybridization::c_fes
FiniteElementSpace & c_fes
Definition hybridization.hpp:67

mfem::Hybridization::H
std::unique_ptr< SparseMatrix > H
The Schur complement system for the Lagrange multiplier.
Definition hybridization.hpp:82

mfem::Hybridization::pH
OperatorHandle pH
Definition hybridization.hpp:91

mfem::Hybridization::fes
FiniteElementSpace & fes
The finite element space.
Definition hybridization.hpp:66

mfem::Hybridization::c_bfi
std::unique_ptr< BilinearFormIntegrator > c_bfi
The constraint integrator.
Definition hybridization.hpp:71

mfem::HypreParMatrix
Wrapper for hypre's ParCSR matrix class.
Definition hypre.hpp:419

mfem::HypreParMatrix::BooleanMult
void BooleanMult(int alpha, const int *x, int beta, int *y)
The "Boolean" analog of y = alpha * A * x + beta * y, where elements in the sparsity pattern of the m...
Definition hypre.hpp:807

mfem::Mesh
Mesh data type.
Definition mesh.hpp:65

mfem::Mesh::Conforming
bool Conforming() const
Definition mesh.cpp:15455

mfem::Mesh::GetNumFaces
int GetNumFaces() const
Return the number of faces (3D), edges (2D) or vertices (1D).
Definition mesh.cpp:6846

mfem::Mesh::GetElementGeometry
Geometry::Type GetElementGeometry(int i) const
Definition mesh.hpp:1535

mfem::Mesh::GetNFbyType
virtual int GetNFbyType(FaceType type) const
Returns the number of faces according to the requested type, does not count master nonconforming face...
Definition mesh.cpp:6862

mfem::Mesh::GetElement
const Element * GetElement(int i) const
Return pointer to the i'th element object.
Definition mesh.hpp:1434

mfem::Mesh::GetNE
int GetNE() const
Returns number of elements.
Definition mesh.hpp:1377

mfem::Mesh::Dimension
int Dimension() const
Dimension of the reference space used within the elements.
Definition mesh.hpp:1306

mfem::Mesh::GetFaceInformation
FaceInformation GetFaceInformation(int f) const
Definition mesh.cpp:1293

mfem::Mesh::GetBdrElementAdjacentElement
void GetBdrElementAdjacentElement(int bdr_el, int &el, int &info) const
For the given boundary element, bdr_el, return its adjacent element and its info, i....
Definition mesh.cpp:7905

mfem::OperatorHandle
Pointer to an Operator of a specified type.
Definition handle.hpp:34

mfem::OperatorHandle::MakePtAP
void MakePtAP(OperatorHandle &A, OperatorHandle &P)
Reset the OperatorHandle to hold the product P^t A P.
Definition handle.cpp:124

mfem::OperatorHandle::MakeSquareBlockDiag
void MakeSquareBlockDiag(MPI_Comm comm, HYPRE_BigInt glob_size, HYPRE_BigInt *row_starts, SparseMatrix *diag)
Reset the OperatorHandle to hold a parallel square block-diagonal matrix using the currently set type...
Definition handle.cpp:61

mfem::OperatorHandle::Type
Operator::Type Type() const
Get the currently set operator type id.
Definition handle.hpp:99

mfem::Operator
Abstract operator.
Definition operator.hpp:25

mfem::Operator::Height
int Height() const
Get the height (size of output) of the Operator. Synonym with NumRows().
Definition operator.hpp:66

mfem::Operator::Mult
virtual void Mult(const Vector &x, Vector &y) const =0
Operator application: y=A(x).

mfem::Operator::Width
int Width() const
Get the width (size of input) of the Operator. Synonym with NumCols().
Definition operator.hpp:72

mfem::Operator::MultTranspose
virtual void MultTranspose(const Vector &x, Vector &y) const
Action of the transpose operator: y=A^t(x). The default behavior in class Operator is to generate an ...
Definition operator.hpp:100

mfem::ParFiniteElementSpace
Abstract parallel finite element space.
Definition pfespace.hpp:31

mfem::SparseMatrix
Data type sparse matrix.
Definition sparsemat.hpp:51

mfem::TensorBasisElement
Definition fe_base.hpp:1250

mfem::TensorBasisElement::GetDofMap
const Array< int > & GetDofMap() const
Get an Array<int> that maps lexicographically ordered indices to the indices of the respective nodes/...
Definition fe_base.hpp:1276

mfem::Vector
Vector data type.
Definition vector.hpp:82

mfem::Vector::Read
virtual const real_t * Read(bool on_dev=true) const
Shortcut for mfem::Read(vec.GetMemory(), vec.Size(), on_dev).
Definition vector.hpp:520

mfem::Vector::ReadWrite
virtual real_t * ReadWrite(bool on_dev=true)
Shortcut for mfem::ReadWrite(vec.GetMemory(), vec.Size(), on_dev).
Definition vector.hpp:536

mfem::Vector::Size
int Size() const
Returns the size of the vector.
Definition vector.hpp:234

mfem::Vector::UseDevice
virtual void UseDevice(bool use_dev) const
Enable execution of Vector operations using the mfem::Device.
Definition vector.hpp:145

mfem::Vector::SetSize
void SetSize(int s)
Resize the vector to size s.
Definition vector.hpp:584

mfem::Vector::HostReadWrite
virtual real_t * HostReadWrite()
Shortcut for mfem::ReadWrite(vec.GetMemory(), vec.Size(), false).
Definition vector.hpp:540

mfem::Vector::Write
virtual real_t * Write(bool on_dev=true)
Shortcut for mfem::Write(vec.GetMemory(), vec.Size(), on_dev).
Definition vector.hpp:528

mfem::Vector::MakeRef
void MakeRef(Vector &base, int offset, int size)
Reset the Vector to be a reference to a sub-vector of base.
Definition vector.hpp:660

dim
int dim
Definition ex24.cpp:53

forall.hpp

hybridization.hpp

hybridization_ext.hpp

kernels.hpp

b
real_t b
Definition lissajous.cpp:42

mfem::kernels::AddMultAtB
MFEM_HOST_DEVICE void AddMultAtB(const int Aheight, const int Awidth, const int Bwidth, const TA *Adata, const TB *Bdata, TC *Cdata, const TB alpha, const TA beta)
Compute C = alpha*At*B + beta*C.
Definition kernels.hpp:471

mfem::kernels::LSolve
MFEM_HOST_DEVICE void LSolve(const real_t *data, const int m, const int *ipiv, real_t *x)
Assuming L.U = P.A factored matrix of size (m x m), compute X <- L^{-1} P X, for a vector X of length...
Definition kernels.hpp:1760

mfem::kernels::USolve
MFEM_HOST_DEVICE void USolve(const real_t *data, const int m, real_t *x)
Assuming L.U = P.A factored matrix of size (m x m), compute X <- U^{-1} X, for a vector X of length m...
Definition kernels.hpp:1785

mfem::kernels::BlockFactor
MFEM_HOST_DEVICE void BlockFactor(const real_t *data, int m, const int *ipiv, int n, real_t *A12, real_t *A21, real_t *A22)
Definition kernels.hpp:1843

mfem::kernels::LUFactor
MFEM_HOST_DEVICE bool LUFactor(real_t *A, const int m, int *ipiv, const real_t tol=0.0)
Compute the LU factorization of the m x m matrix A.
Definition kernels.hpp:1885

mfem::kernels::SubMult
MFEM_HOST_DEVICE void SubMult(const int m, const int n, const int r, const real_t *A21, const real_t *X1, real_t *X2)
Given an (n x m) matrix A21, compute X2 <- X2 - A21 X1, for matrices X1, and X2 of size (m x r) and (...
Definition kernels.hpp:1815

mfem::kernels::LUSolve
MFEM_HOST_DEVICE void LUSolve(const real_t *data, const int m, const int *ipiv, real_t *x)
Assuming L.U = P.A for a factored matrix (m x m), compute X <- A^{-1} X, for a vector X of length m.
Definition kernels.hpp:1805

mfem
Definition CodeDocumentation.dox:1

mfem::add
void add(const Vector &v1, const Vector &v2, Vector &v)
Definition vector.cpp:414

mfem::Reshape
MFEM_HOST_DEVICE DeviceTensor< sizeof...(Dims), T > Reshape(T *ptr, Dims... dims)
Wrap a pointer as a DeviceTensor with automatically deduced template parameters.
Definition dtensor.hpp:138

mfem::UsesTensorBasis
bool UsesTensorBasis(const FiniteElementSpace &fes)
Return true if the mesh contains only one topology and the elements are tensor elements.
Definition fespace.hpp:1548

mfem::real_t
float real_t
Definition config.hpp:46

mfem::MemoryType::SIZE
@ SIZE
Number of host and device memory types.

mfem::ElementDofOrdering
ElementDofOrdering
Constants describing the possible orderings of the DOFs in one element.
Definition fespace.hpp:47

mfem::ElementDofOrdering::NATIVE
@ NATIVE
Native ordering as defined by the FiniteElement.

mfem::f
std::function< real_t(const Vector &)> f(real_t mass_coeff)
Definition lor_mms.hpp:30

mfem::forall
void forall(int N, lambda &&body)
Definition forall.hpp:839

mfem::FaceType::Interior
@ Interior

pfespace.hpp

mfem::Mesh::FaceInformation
This structure is used as a human readable output format that deciphers the information contained in ...
Definition mesh.hpp:2081

mfem::Mesh::FaceInformation::index
int index
Definition mesh.hpp:2088

mfem::Mesh::FaceInformation::element
struct mfem::Mesh::FaceInformation::@15 element[2]

mfem::Mesh::FaceInformation::IsInterior
bool IsInterior() const
return true if the face is an interior face to the computation domain, either a local or shared inter...
Definition mesh.hpp:2115

mfem::Mesh::FaceInformation::local_face_id
int local_face_id
Definition mesh.hpp:2089

mfem::Mesh::FaceInformation::IsShared
bool IsShared() const
Return true if the face is a shared interior face which is NOT a master nonconforming face.
Definition mesh.hpp:2106