4.5.2/lor__rt_8cpp_source.html

 // Copyright (c) 2010-2023, Lawrence Livermore National Security, LLC. Produced
 // at the Lawrence Livermore National Laboratory. All Rights reserved. See files
 // LICENSE and NOTICE for details. LLNL-CODE-806117.
 //
 // This file is part of the MFEM library. For more information and source code
 // availability visit https://mfem.org.
 //
 // MFEM is free software; you can redistribute it and/or modify it under the
 // terms of the BSD-3 license. We welcome feedback and contributions, see file
 // CONTRIBUTING.md for details.

 #include "lor_rt.hpp"
 #include "lor_util.hpp"
 #include "../../linalg/dtensor.hpp"
 #include "../../general/forall.hpp"

 namespace mfem
 {

 // Batched assembly of the 2D low-order-refined (LOR) RT matrix.
 //
 // Each high-order element is split into ORDER x ORDER low-order sub-elements.
 // For every sub-element a dense 4x4 local matrix (one row/column per
 // sub-element edge) is computed and accumulated into the macro-element sparse
 // matrix of the enclosing high-order element.
 //
 // Reads:
 //  - c1: coefficient multiplying the mass (basis-basis) term,
 //  - c2: coefficient multiplying the div-div term.
 //    Each is either a single constant (Size() == 1) or is indexed as
 //    (op1, op1, nel_ho), i.e. one value per sub-element vertex.
 //  - X_vert: vertex coordinates, accessed through LORVertexCoordinates2D.
 //
 // Writes:
 //  - sparse_ij: resized to nnz_per_row*ndof_per_el*nel_ho and indexed as
 //    (nonzero slot, DOF index within component, component, element).
 //  - sparse_mapping: resized to nnz_per_row*ndof_per_el; entry (slot, row)
 //    is the element-local column index stored in that slot, or -1 if the slot
 //    is unused for that row.
 template <int ORDER>
 void BatchedLOR_RT::Assemble2D()
 {
    const int nel_ho = fes_ho.GetNE();

    static constexpr int nv = 4; // number of vertices in quadrilateral
    static constexpr int ne = 4; // number of edges in quadrilateral
    static constexpr int dim = 2;
    static constexpr int ddm2 = (dim*(dim+1))/2;
    static constexpr int ngeom = ddm2 + 1; // number of geometric factors stored
    static constexpr int o = ORDER;
    static constexpr int op1 = ORDER + 1;
    static constexpr int ndof_per_el = dim*o*op1;
    static constexpr int nnz_per_row = 7;
    static constexpr int sz_local_mat = ne*ne;

    // A coefficient vector of size one is treated as a constant coefficient.
    const bool const_mq = c1.Size() == 1;
    const auto MQ = const_mq
                    ? Reshape(c1.Read(), 1, 1, 1)
                    : Reshape(c1.Read(), op1, op1, nel_ho);
    const bool const_dq = c2.Size() == 1;
    const auto DQ = const_dq
                    ? Reshape(c2.Read(), 1, 1, 1)
                    : Reshape(c2.Read(), op1, op1, nel_ho);

    sparse_ij.SetSize(nnz_per_row*ndof_per_el*nel_ho);
    auto V = Reshape(sparse_ij.Write(), nnz_per_row, o*op1, dim, nel_ho);

    auto X = X_vert.Read();

    MFEM_FORALL_2D(iel_ho, nel_ho, ORDER, ORDER, 1,
    {
       // Zero all entries of this element before accumulating. The flat index
       // ix+iy*op1 covers the full range [0, o*op1) for both components.
       MFEM_FOREACH_THREAD(iy,y,o)
       {
          MFEM_FOREACH_THREAD(ix,x,op1)
          {
             for (int c=0; c<dim; ++c)
             {
                for (int j=0; j<nnz_per_row; ++j)
                {
                   V(j,ix+iy*op1,c,iel_ho) = 0.0;
                }
             }
          }
       }
       MFEM_SYNC_THREAD;

       // Loop over the sub-elements
       MFEM_FOREACH_THREAD(ky,y,ORDER)
       {
          MFEM_FOREACH_THREAD(kx,x,ORDER)
          {
             // Compute geometric factors at quadrature points
             double Q_[ngeom*nv];
             double local_mat_[sz_local_mat];

             DeviceTensor<3> Q(Q_, ngeom, 2, 2);
             DeviceTensor<2> local_mat(local_mat_, ne, ne);

             // local_mat is the local (dense) stiffness matrix
             for (int i=0; i<sz_local_mat; ++i) { local_mat[i] = 0.0; }

             double vx[4], vy[4];
             LORVertexCoordinates2D<ORDER>(X, iel_ho, kx, ky, vx, vy);

             // The quadrature points are the four reference vertices
             // (x,y in {0,1}), each with weight 1/4.
             for (int iqx=0; iqx<2; ++iqx)
             {
                for (int iqy=0; iqy<2; ++iqy)
                {
                   const double x = iqx;
                   const double y = iqy;
                   const double w = 1.0/4.0;

                   double J_[2*2];
                   DeviceTensor<2> J(J_, 2, 2);

                   Jacobian2D(x, y, vx, vy, J);

                   const double detJ = Det2D(J);
                   const double w_detJ = w/detJ;

                   // Q(0..2): entries of (w/detJ) J^T J; Q(3): w/detJ
                   Q(0,iqy,iqx) = w_detJ * (J(0,0)*J(0,0) + J(1,0)*J(1,0)); // 1,1
                   Q(1,iqy,iqx) = w_detJ * (J(0,0)*J(0,1) + J(1,0)*J(1,1)); // 1,2
                   Q(2,iqy,iqx) = w_detJ * (J(0,1)*J(0,1) + J(1,1)*J(1,1)); // 2,2
                   Q(3,iqy,iqx) = w_detJ;
                }
             }
             for (int iqx=0; iqx<2; ++iqx)
             {
                for (int iqy=0; iqy<2; ++iqy)
                {
                   const double mq = const_mq ? MQ(0,0,0) : MQ(kx+iqx, ky+iqy, iel_ho);
                   const double dq = const_dq ? DQ(0,0,0) : DQ(kx+iqx, ky+iqy, iel_ho);
                   // Loop over x,y components. c=0 => x, c=1 => y
                   for (int cj=0; cj<dim; ++cj)
                   {
                      for (int bj=0; bj<2; ++bj)
                      {
                         // Value of basis function (cj,bj) at this
                         // quadrature point: 1 on its own edge, 0 otherwise.
                         const double bxj = (cj == 0 && bj == iqx) ? 1 : 0;
                         const double byj = (cj == 1 && bj == iqy) ? 1 : 0;
                         const double div_j = (bj == 0) ? -1 : 1;

                         // Local column index; an integer, since it is used
                         // to index local_mat.
                         const int jj_loc = bj + 2*cj;

                         for (int ci=0; ci<dim; ++ci)
                         {
                            for (int bi=0; bi<2; ++bi)
                            {
                               const double bxi = (ci == 0 && bi == iqx) ? 1 : 0;
                               const double byi = (ci == 1 && bi == iqy) ? 1 : 0;
                               const double div_i = (bi == 0) ? -1 : 1;

                               // Local row index
                               const int ii_loc = bi + 2*ci;

                               // Only store the lower-triangular part of
                               // the matrix (by symmetry).
                               if (jj_loc > ii_loc) { continue; }

                               // Mass term scaled by mq, plus div-div term
                               // scaled by dq.
                               double val = 0.0;
                               val += bxi*bxj*Q(0,iqy,iqx);
                               val += byi*bxj*Q(1,iqy,iqx);
                               val += bxi*byj*Q(1,iqy,iqx);
                               val += byi*byj*Q(2,iqy,iqx);
                               val *= mq;
                               val += dq*div_j*div_i*Q(3,iqy,iqx);

                               local_mat(ii_loc, jj_loc) += val;
                            }
                         }
                      }
                   }
                }
             }
             // Assemble the local matrix into the macro-element sparse matrix
             // in a format similar to coordinate format. The (I,J) arrays
             // are implicit (not stored explicitly).
             for (int ii_loc=0; ii_loc<ne; ++ii_loc)
             {
                const int ci = ii_loc/2;
                const int bi = ii_loc%2;
                const int ix = (ci == 0) ? bi : 0;
                const int iy = (ci == 1) ? bi : 0;

                // Row index within component ci. The row stride is op1 for
                // the x-component and o for the y-component.
                int ii = kx+ix + (ky+iy)*((ci == 0) ? op1 : o);

                for (int jj_loc=0; jj_loc<ne; ++jj_loc)
                {
                   const int cj = jj_loc/2;
                   const int bj = jj_loc%2;

                   // Slots 0-2: couplings within the same component; slots
                   // 3-6: couplings with the other component.
                   const int jj_off = (ci == cj) ? (bj - bi + 1) : (3 + 1-bi + 2*bj);

                   // Symmetry
                   const double val = (jj_loc <= ii_loc)
                                      ? local_mat(ii_loc, jj_loc)
                                      : local_mat(jj_loc, ii_loc);
                   // Adjacent sub-elements share edges, so several threads
                   // may contribute to the same entry.
                   AtomicAdd(V(jj_off, ii, ci, iel_ho), val);
                }
             }
          }
       }
    });

    // Build the element-local sparsity pattern on the host. Slots that are not
    // assigned below keep the value -1.
    sparse_mapping.SetSize(nnz_per_row*ndof_per_el);
    sparse_mapping = -1;
    auto map = Reshape(sparse_mapping.HostReadWrite(), nnz_per_row, ndof_per_el);
    for (int ci=0; ci<2; ++ci)
    {
       const int i_off = (ci == 0) ? 0 : o*op1;
       // id0 is the axis along the component direction, id1 the other axis.
       const int id0 = ci;
       const int id1 = (ci+1)%2;

       const int nxi = (ci == 0) ? op1 : o;

       for (int i0=0; i0<op1; ++i0)
       {
          for (int i1=0; i1<o; ++i1)
          {
             int ii_lex[2];
             ii_lex[id0] = i0;
             ii_lex[id1] = i1;
             const int ii_el = i_off + ii_lex[0] + ii_lex[1]*nxi;

             // cj_rel == 0: same component as the row; cj_rel == 1: the other
             // component.
             for (int cj_rel=0; cj_rel<2; ++cj_rel)
             {
                const int cj = (ci + cj_rel) % 2;
                const int j_off = (cj == 0) ? 0 : o*op1;
                const int nxj = (cj == 0) ? op1 : o;

                // Index ranges of the coupled DOFs, clamped at the element
                // boundary.
                const int j0_begin = (i0 > 0) ? i0-1 : i0;
                const int j0_end = (cj_rel == 0)
                                   ? ((i0 < o) ? i0+1 : i0)
                                   : ((i0 < o) ? i0 : i0-1);
                const int j1_begin = i1;
                const int j1_end = (cj_rel == 0) ? i1 : i1+1;

                for (int j0=j0_begin; j0<=j0_end; ++j0)
                {
                   const int d0 = 1 + j0 - i0;
                   for (int j1=j1_begin; j1<=j1_end; ++j1)
                   {
                      const int d1 = j1 - i1;
                      int jj_lex[2];
                      jj_lex[id0] = j0;
                      jj_lex[id1] = j1;
                      const int jj_el = j_off + jj_lex[0] + jj_lex[1]*nxj;
                      // Same slot numbering as used in the kernel above.
                      const int jj_off = (cj_rel == 0) ? d0 : 3 + d0 + 2*d1;
                      map(jj_off, ii_el) = jj_el;
                   }
                }
             }
          }
       }
    }
 }

 // Batched assembly of the 3D low-order-refined (LOR) RT matrix.
 //
 // Each high-order element is split into ORDER^3 low-order sub-elements. For
 // every sub-element a dense 6x6 local matrix (one row/column per sub-element
 // face) is computed and accumulated into the macro-element sparse matrix of
 // the enclosing high-order element.
 //
 // Reads:
 //  - c1: coefficient multiplying the mass (basis-basis) term,
 //  - c2: coefficient multiplying the div-div term.
 //    Each is either a single constant (Size() == 1) or is indexed as
 //    (op1, op1, op1, nel_ho), i.e. one value per sub-element vertex.
 //  - X_vert: vertex coordinates, accessed through LORVertexCoordinates3D.
 //
 // Writes:
 //  - sparse_ij: resized to nnz_per_row*ndof_per_el*nel_ho and indexed as
 //    (nonzero slot, DOF index within component, component, element).
 //  - sparse_mapping: resized to nnz_per_row*ndof_per_el; entry (slot, row)
 //    is the element-local column index stored in that slot, or -1 if the slot
 //    is unused for that row.
 template <int ORDER>
 void BatchedLOR_RT::Assemble3D()
 {
    const int nel_ho = fes_ho.GetNE();

    static constexpr int nv = 8; // number of vertices in hexahedron
    static constexpr int nf = 6; // number of faces in hexahedron
    static constexpr int dim = 3;
    static constexpr int ddm2 = (dim*(dim+1))/2;
    static constexpr int ngeom = ddm2 + 1; // number of geometric factors stored
    static constexpr int o = ORDER;
    static constexpr int op1 = ORDER + 1;
    static constexpr int ndof_per_el = dim*o*o*op1;
    static constexpr int nnz_per_row = 11;
    static constexpr int sz_local_mat = nf*nf;

    // A coefficient vector of size one is treated as a constant coefficient.
    const bool const_mq = c1.Size() == 1;
    const auto MQ = const_mq
                    ? Reshape(c1.Read(), 1, 1, 1, 1)
                    : Reshape(c1.Read(), op1, op1, op1, nel_ho);
    const bool const_dq = c2.Size() == 1;
    const auto DQ = const_dq
                    ? Reshape(c2.Read(), 1, 1, 1, 1)
                    : Reshape(c2.Read(), op1, op1, op1, nel_ho);

    sparse_ij.SetSize(nnz_per_row*ndof_per_el*nel_ho);
    auto V = Reshape(sparse_ij.Write(), nnz_per_row, o*o*op1, dim, nel_ho);

    auto X = X_vert.Read();

    // Last thread dimension is lowered to avoid "too many resources" error
    MFEM_FORALL_3D(iel_ho, nel_ho, ORDER, ORDER, (ORDER>6)?4:ORDER,
    {
       // Zero all entries of this element before accumulating. The flat index
       // ix+iy*op1+iz*o*op1 covers the full range [0, o*o*op1) for every
       // component.
       MFEM_FOREACH_THREAD(iz,z,o)
       {
          MFEM_FOREACH_THREAD(iy,y,o)
          {
             MFEM_FOREACH_THREAD(ix,x,op1)
             {
                for (int c=0; c<dim; ++c)
                {
                   for (int j=0; j<nnz_per_row; ++j)
                   {
                      V(j,ix+iy*op1+iz*o*op1,c,iel_ho) = 0.0;
                   }
                }
             }
          }
       }
       MFEM_SYNC_THREAD;

       // Loop over the sub-elements
       MFEM_FOREACH_THREAD(kz,z,ORDER)
       {
          MFEM_FOREACH_THREAD(ky,y,ORDER)
          {
             MFEM_FOREACH_THREAD(kx,x,ORDER)
             {
                // Geometric factors at quadrature points (element vertices)
                double Q_[ngeom*nv];
                DeviceTensor<4> Q(Q_, ngeom, 2, 2, 2);

                // local_mat is the local (dense) matrix of this sub-element
                double local_mat_[sz_local_mat];
                DeviceTensor<2> local_mat(local_mat_, nf, nf);
                for (int i=0; i<sz_local_mat; ++i) { local_mat[i] = 0.0; }

                double vx[8], vy[8], vz[8];
                LORVertexCoordinates3D<ORDER>(X, iel_ho, kx, ky, kz, vx, vy, vz);

                // The quadrature points are the eight reference vertices
                // (x,y,z in {0,1}), each with weight 1/8.
                for (int iqz=0; iqz<2; ++iqz)
                {
                   for (int iqy=0; iqy<2; ++iqy)
                   {
                      for (int iqx=0; iqx<2; ++iqx)
                      {
                         const double x = iqx;
                         const double y = iqy;
                         const double z = iqz;
                         const double w = 1.0/8.0;

                         double J_[3*3];
                         DeviceTensor<2> J(J_, 3, 3);

                         Jacobian3D(x, y, z, vx, vy, vz, J);

                         const double detJ = Det3D(J);
                         const double w_detJ = w/detJ;

                         // Q(0..5): entries of (w/detJ) J^T J; Q(6): w/detJ
                         Q(0,iqz,iqy,iqx) = w_detJ*(J(0,0)*J(0,0)+J(1,0)*J(1,0)+J(2,0)*J(2,0)); // 1,1
                         Q(1,iqz,iqy,iqx) = w_detJ*(J(0,1)*J(0,0)+J(1,1)*J(1,0)+J(2,1)*J(2,0)); // 2,1
                         Q(2,iqz,iqy,iqx) = w_detJ*(J(0,2)*J(0,0)+J(1,2)*J(1,0)+J(2,2)*J(2,0)); // 3,1
                         Q(3,iqz,iqy,iqx) = w_detJ*(J(0,1)*J(0,1)+J(1,1)*J(1,1)+J(2,1)*J(2,1)); // 2,2
                         Q(4,iqz,iqy,iqx) = w_detJ*(J(0,2)*J(0,1)+J(1,2)*J(1,1)+J(2,2)*J(2,1)); // 3,2
                         Q(5,iqz,iqy,iqx) = w_detJ*(J(0,2)*J(0,2)+J(1,2)*J(1,2)+J(2,2)*J(2,2)); // 3,3
                         Q(6,iqz,iqy,iqx) = w_detJ;
                      }
                   }
                }
                for (int iqz=0; iqz<2; ++iqz)
                {
                   for (int iqy=0; iqy<2; ++iqy)
                   {
                      for (int iqx=0; iqx<2; ++iqx)
                      {
                         const double mq = const_mq ? MQ(0,0,0,0) : MQ(kx+iqx, ky+iqy, kz+iqz, iel_ho);
                         const double dq = const_dq ? DQ(0,0,0,0) : DQ(kx+iqx, ky+iqy, kz+iqz, iel_ho);
                         // Loop over x,y,z components. 0 => x, 1 => y, 2 => z
                         for (int cj=0; cj<dim; ++cj)
                         {
                            // Quadrature index along the direction of
                            // component cj (an integer in {0,1}).
                            const int jq0 = (cj == 0) ? iqx : ((cj == 1) ? iqy : iqz);

                            const int jd_0 = cj;
                            const int jd_1 = (cj + 1)%3;
                            const int jd_2 = (cj + 2)%3;

                            for (int bj=0; bj<2; ++bj) // 2 faces in each dim
                            {
                               const double div_j = (bj == 0) ? -1 : 1;

                               // Value of basis function (cj,bj) at this
                               // quadrature point: 1 in direction cj on its
                               // own face, 0 otherwise.
                               double basis_j[3];
                               basis_j[jd_0] = (bj == jq0) ? 1 : 0;
                               basis_j[jd_1] = 0.0;
                               basis_j[jd_2] = 0.0;

                               const int jj_loc = bj + 2*cj;

                               for (int ci=0; ci<dim; ++ci)
                               {
                                  const int iq0 = (ci == 0) ? iqx : ((ci == 1) ? iqy : iqz);

                                  const int id_0 = ci;
                                  const int id_1 = (ci + 1)%3;
                                  const int id_2 = (ci + 2)%3;

                                  for (int bi=0; bi<2; ++bi)
                                  {
                                     const double div_i = (bi == 0) ? -1 : 1;

                                     double basis_i[3];
                                     basis_i[id_0] = (bi == iq0) ? 1 : 0;
                                     basis_i[id_1] = 0.0;
                                     basis_i[id_2] = 0.0;

                                     const int ii_loc = bi + 2*ci;

                                     // Only store the lower-triangular part of
                                     // the matrix (by symmetry).
                                     if (jj_loc > ii_loc) { continue; }

                                     const double div_div = Q(6,iqz,iqy,iqx)*div_i*div_j;

                                     double basis_basis = 0.0;
                                     basis_basis += Q(0,iqz,iqy,iqx)*basis_i[0]*basis_j[0];
                                     basis_basis += Q(1,iqz,iqy,iqx)*(basis_i[0]*basis_j[1] + basis_i[1]*basis_j[0]);
                                     basis_basis += Q(2,iqz,iqy,iqx)*(basis_i[0]*basis_j[2] + basis_i[2]*basis_j[0]);
                                     basis_basis += Q(3,iqz,iqy,iqx)*basis_i[1]*basis_j[1];
                                     basis_basis += Q(4,iqz,iqy,iqx)*(basis_i[1]*basis_j[2] + basis_i[2]*basis_j[1]);
                                     basis_basis += Q(5,iqz,iqy,iqx)*basis_i[2]*basis_j[2];

                                     // Div-div term scaled by dq plus mass
                                     // term scaled by mq.
                                     const double val = dq*div_div + mq*basis_basis;

                                     local_mat(ii_loc, jj_loc) += val;
                                  }
                               }
                            }
                         }
                      }
                   }
                }
                // Assemble the local matrix into the macro-element sparse matrix
                // The nonzeros of the macro-element sparse matrix are ordered as
                // follows:
                //
                // The axes are ordered relative to the direction of the basis
                // vector, e.g. for x-vectors, the axes are (x,y,z), for
                // y-vectors the axes are (y,z,x), and for z-vectors the axes are
                // (z,x,y).
                //
                // The nonzeros are then given in "rotated lexicographic"
                // ordering, according to these axes.
                for (int ii_loc=0; ii_loc<nf; ++ii_loc)
                {
                   const int ci = ii_loc/2;
                   const int bi = ii_loc%2;

                   const int id0 = ci;
                   const int id1 = (ci+1)%3;
                   const int id2 = (ci+2)%3;

                   const int i0 = bi;
                   const int i1 = 0;
                   const int i2 = 0;

                   int ii_lex[3];
                   ii_lex[id0] = i0;
                   ii_lex[id1] = i1;
                   ii_lex[id2] = i2;

                   // Grid extents for component ci: op1 along the component
                   // direction and o along the other directions.
                   const int nx = (ci == 0) ? op1 : o;
                   const int ny = (ci == 1) ? op1 : o;

                   const int ii = kx+ii_lex[0] + (ky+ii_lex[1])*nx + (kz+ii_lex[2])*nx*ny;

                   for (int jj_loc=0; jj_loc<nf; ++jj_loc)
                   {
                      const int cj = jj_loc/2;
                      // add 3 to take modulus (rather than remainder) when
                      // (cj - ci) is negative
                      const int cj_rel = (3 + cj - ci)%3;

                      const int bj = jj_loc%2;

                      const int jd0 = cj_rel;
                      const int jd1 = (cj_rel+1)%3;
                      const int jd2 = (cj_rel+2)%3;

                      int jj_rel[3];
                      jj_rel[jd0] = bj;
                      jj_rel[jd1] = 0;
                      jj_rel[jd2] = 0;

                      const int d0 = jj_rel[0] - i0 + 1;
                      const int d1 = jj_rel[1] - i1;
                      const int d2 = jj_rel[2] - i2;
                      // Slots 0-2: same component; slots 3-6: next component
                      // in the rotated ordering; slots 7-10: the remaining
                      // component.
                      int jj_off;
                      if (cj_rel == 0) { jj_off = d0; }
                      else if (cj_rel == 1) { jj_off = 3 + d0 + 2*d1; }
                      else /* if (cj_rel == 2) */ { jj_off = 7 + d0 + 2*d2; }

                      // Symmetry
                      const double val = (jj_loc <= ii_loc)
                                         ? local_mat(ii_loc, jj_loc)
                                         : local_mat(jj_loc, ii_loc);
                      // Adjacent sub-elements share faces, so several threads
                      // may contribute to the same entry.
                      AtomicAdd(V(jj_off, ii, ci, iel_ho), val);
                   }
                }
             }
          }
       }
    });

    // Build the element-local sparsity pattern on the host. Slots that are not
    // assigned below keep the value -1.
    sparse_mapping.SetSize(nnz_per_row*ndof_per_el);
    sparse_mapping = -1;
    auto map = Reshape(sparse_mapping.HostReadWrite(), nnz_per_row, ndof_per_el);
    for (int ci=0; ci<dim; ++ci)
    {
       const int i_off = ci*o*o*op1;
       // Rotated axes: id0 is the component direction, id1 and id2 follow
       // cyclically.
       const int id0 = ci;
       const int id1 = (ci+1)%3;
       const int id2 = (ci+2)%3;

       const int nxi = (ci == 0) ? op1 : o;
       const int nyi = (ci == 1) ? op1 : o;

       for (int i0=0; i0<op1; ++i0)
       {
          for (int i1=0; i1<o; ++i1)
          {
             for (int i2=0; i2<o; ++i2)
             {
                int ii_lex[3];
                ii_lex[id0] = i0;
                ii_lex[id1] = i1;
                ii_lex[id2] = i2;
                const int ii_el = i_off + ii_lex[0] + ii_lex[1]*nxi + ii_lex[2]*nxi*nyi;

                for (int cj_rel=0; cj_rel<dim; ++cj_rel)
                {
                   const int cj = (ci + cj_rel) % 3;
                   const int j_off = cj*o*o*op1;

                   const int nxj = (cj == 0) ? op1 : o;
                   const int nyj = (cj == 1) ? op1 : o;

                   // Index ranges of the coupled DOFs, clamped at the element
                   // boundary.
                   const int j0_begin = (i0 > 0) ? i0-1 : i0;
                   const int j0_end = (cj_rel == 0)
                                      ? ((i0 < o) ? i0+1 : i0)
                                      : ((i0 < o) ? i0 : i0-1);
                   const int j1_begin = i1;
                   const int j1_end = (cj_rel == 1) ? i1+1 : i1;
                   const int j2_begin = i2;
                   const int j2_end = (cj_rel == 2) ? i2+1 : i2;

                   for (int j0=j0_begin; j0<=j0_end; ++j0)
                   {
                      const int d0 = 1 + j0 - i0;
                      for (int j1=j1_begin; j1<=j1_end; ++j1)
                      {
                         const int d1 = j1 - i1;
                         for (int j2=j2_begin; j2<=j2_end; ++j2)
                         {
                            const int d2 = j2 - i2;
                            int jj_lex[3];
                            jj_lex[id0] = j0;
                            jj_lex[id1] = j1;
                            jj_lex[id2] = j2;
                            const int jj_el = j_off + jj_lex[0] + jj_lex[1]*nxj + jj_lex[2]*nxj*nyj;
                            // Same slot numbering as used in the kernel above.
                            int jj_off;
                            if (cj_rel == 0) { jj_off = d0; }
                            else if (cj_rel == 1) { jj_off = 3 + d0 + 2*d1; }
                            else /* if (cj_rel == 2) */ { jj_off = 7 + d0 + 2*d2; }
                            map(jj_off, ii_el) = jj_el;
                         }
                      }
                   }
                }
             }
          }
       }
    }
 }

 // Explicit template instantiations
 //
 // Assemble2D and Assemble3D are member function templates whose definitions
 // live in this source file, so the ORDER values that other translation units
 // may use have to be instantiated here. Orders 1 through 8 are provided for
 // both the 2D and the 3D kernel.
 template void BatchedLOR_RT::Assemble2D<1>();
 template void BatchedLOR_RT::Assemble2D<2>();
 template void BatchedLOR_RT::Assemble2D<3>();
 template void BatchedLOR_RT::Assemble2D<4>();
 template void BatchedLOR_RT::Assemble2D<5>();
 template void BatchedLOR_RT::Assemble2D<6>();
 template void BatchedLOR_RT::Assemble2D<7>();
 template void BatchedLOR_RT::Assemble2D<8>();

 template void BatchedLOR_RT::Assemble3D<1>();
 template void BatchedLOR_RT::Assemble3D<2>();
 template void BatchedLOR_RT::Assemble3D<3>();
 template void BatchedLOR_RT::Assemble3D<4>();
 template void BatchedLOR_RT::Assemble3D<5>();
 template void BatchedLOR_RT::Assemble3D<6>();
 template void BatchedLOR_RT::Assemble3D<7>();
 template void BatchedLOR_RT::Assemble3D<8>();

 // Construct the batched LOR assembly kernel for RT spaces.
 //
 // fes_ho_, X_vert_, sparse_ij_ and sparse_mapping_ are forwarded unchanged to
 // the BatchedLORKernel base class. The bilinear form a is used only to fill
 // the two coefficient vectors: c1 for VectorFEMassIntegrator and c2 for
 // DivDivIntegrator. In the assembly kernels c1 scales the mass term and c2
 // scales the div-div term.
 //
 // NOTE(review): ProjectLORCoefficient is defined elsewhere; presumably it
 // looks up the integrator of the given type in a and stores its coefficient
 // in the output vector. Confirm against its definition.
 BatchedLOR_RT::BatchedLOR_RT(BilinearForm &a,
                              FiniteElementSpace &fes_ho_,
                              Vector &X_vert_,
                              Vector &sparse_ij_,
                              Array<int> &sparse_mapping_)
    : BatchedLORKernel(fes_ho_, X_vert_, sparse_ij_, sparse_mapping_)
 {
    ProjectLORCoefficient<VectorFEMassIntegrator>(a, c1);
    ProjectLORCoefficient<DivDivIntegrator>(a, c2);
 }

 } // namespace mfem
mfem::Array::HostReadWrite
T * HostReadWrite()
Shortcut for mfem::ReadWrite(a.GetMemory(), a.Size(), false).
Definition: array.hpp:327

mfem::BatchedLORKernel
Abstract base class for the batched LOR assembly kernels.
Definition: lor_batched.hpp:167

mfem::BatchedLORKernel::sparse_mapping
Array< int > & sparse_mapping
Local element sparsity pattern.
Definition: lor_batched.hpp:173

mfem::Vector::SetSize
void SetSize(int s)
Resize the vector to size s.
Definition: vector.hpp:512

AtomicAdd
MFEM_HOST_DEVICE T AtomicAdd(T &add, const T val)
Definition: backends.hpp:84

mfem::Vector::Size
int Size() const
Returns the size of the vector.
Definition: vector.hpp:199

mfem::Vector::Read
virtual const double * Read(bool on_dev=true) const
Shortcut for mfem::Read(vec.GetMemory(), vec.Size(), on_dev).
Definition: vector.hpp:448

mfem::BatchedLORKernel::c2
CoefficientVector c2
Coefficient of second integrator.
Definition: lor_batched.hpp:177

mfem::BatchedLOR_RT::BatchedLOR_RT
BatchedLOR_RT(BilinearForm &a, FiniteElementSpace &fes_ho_, Vector &X_vert_, Vector &sparse_ij_, Array< int > &sparse_mapping_)
Definition: lor_rt.cpp:568

mfem
Definition: CodeDocumentation.dox:1

mfem::Vector::Write
virtual double * Write(bool on_dev=true)
Shortcut for mfem::Write(vec.GetMemory(), vec.Size(), on_dev).
Definition: vector.hpp:456

mfem::Array< int >

mfem::BatchedLORKernel::sparse_ij
Vector & sparse_ij
Local element sparsity matrix data.
Definition: lor_batched.hpp:172

mfem::BatchedLOR_RT::Assemble2D
void Assemble2D()
Definition: lor_rt.cpp:21

mfem::BatchedLOR_RT::Assemble3D
void Assemble3D()
Definition: lor_rt.cpp:237

lor_rt.hpp

mfem::Det3D
MFEM_HOST_DEVICE double Det3D(DeviceMatrix &J)
Definition: lor_util.hpp:188

mfem::Det2D
MFEM_HOST_DEVICE double Det2D(DeviceMatrix &J)
Definition: lor_util.hpp:183

mfem::Jacobian3D
MFEM_HOST_DEVICE void Jacobian3D(const double x, const double y, const double z, const double vx[8], const double vy[8], const double vz[8], DeviceMatrix &J)
Definition: lor_util.hpp:126

mfem::BatchedLORKernel::fes_ho
FiniteElementSpace & fes_ho
The associated high-order space.
Definition: lor_batched.hpp:170

mfem::DeviceTensor
A basic generic Tensor class, appropriate for use on the GPU.
Definition: dtensor.hpp:81

mfem::FiniteElementSpace::GetNE
int GetNE() const
Returns number of elements in the mesh.
Definition: fespace.hpp:614

mfem::Jacobian2D
MFEM_HOST_DEVICE void Jacobian2D(const double x, const double y, const double vx[4], const double vy[4], DeviceMatrix &J)
Definition: lor_util.hpp:115

mfem::BatchedLORKernel::X_vert
Vector & X_vert
Mesh coordinate vector.
Definition: lor_batched.hpp:171

mfem::FiniteElementSpace
Class FiniteElementSpace - responsible for providing FEM view of the mesh, mainly managing the set of...
Definition: fespace.hpp:96

mfem::Array::SetSize
void SetSize(int nsize)
Change the logical size of the array, keep existing entries.
Definition: array.hpp:684

a
double a
Definition: lissajous.cpp:41

mfem::BilinearForm
A "square matrix" operator for the associated FE space and BLFIntegrators The sum of all the BLFInteg...
Definition: bilinearform.hpp:60

dim
int dim
Definition: ex24.cpp:53

lor_util.hpp

mfem::Vector
Vector data type.
Definition: vector.hpp:60

mfem::Reshape
MFEM_HOST_DEVICE DeviceTensor< sizeof...(Dims), T > Reshape(T *ptr, Dims... dims)
Wrap a pointer as a DeviceTensor with automatically deduced template parameters.
Definition: dtensor.hpp:131

mfem::BatchedLORKernel::c1
CoefficientVector c1
Coefficient of first integrator.
Definition: lor_batched.hpp:176