MFEM v4.7.0
Finite element discretization library
ex1p.cpp
//                       MFEM Example 1 - Parallel Version
//                              AmgX Modification
//
// Compile with: make ex1p
//
// AmgX sample runs:
//               mpirun -np 4 ex1p
//               mpirun -np 4 ex1p -d cuda
//               mpirun -np 10 ex1p --amgx-file amg_pcg.json --amgx-mpi-teams
//               mpirun -np 4 ex1p --amgx-file amg_pcg.json
//               (a sketch of such a JSON configuration is given right after
//               this header comment)
//
// Description:  This example code demonstrates the use of MFEM to define a
//               simple finite element discretization of the Laplace problem
//               -Delta u = 1 with homogeneous Dirichlet boundary conditions.
//               Specifically, we discretize using a FE space of the specified
//               order, or if order < 1 using an isoparametric/isogeometric
//               space (i.e. quadratic for quadratic curvilinear mesh, NURBS
//               for NURBS mesh, etc.)
//
//               The example highlights the use of mesh refinement, finite
//               element grid functions, as well as linear and bilinear forms
//               corresponding to the left-hand side and right-hand side of the
//               discrete linear system. We also cover the explicit elimination
//               of essential boundary conditions, static condensation, and the
//               optional connection to the GLVis tool for visualization.

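// Note: the sample runs above pass an AmgX solver configuration through
// --amgx-file. The contents of amg_pcg.json are not reproduced on this page;
// the block below is only a minimal sketch of the general shape of such a
// file (an AMG-preconditioned PCG solve). The field names and values are
// illustrative assumptions, not the configuration shipped with MFEM:
//
//   {
//     "config_version": 2,
//     "solver": {
//       "solver": "PCG",
//       "preconditioner": {
//         "solver": "AMG",
//         "smoother": "BLOCK_JACOBI",
//         "max_iters": 1
//       },
//       "max_iters": 100,
//       "tolerance": 1e-8,
//       "monitor_residual": 1
//     }
//   }
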
#include "mfem.hpp"
#include <fstream>
#include <iostream>

using namespace std;
using namespace mfem;

#ifndef MFEM_USE_AMGX
#error This example requires that MFEM is built with MFEM_USE_AMGX=YES
#endif

int main(int argc, char *argv[])
{
   // 1. Initialize MPI and HYPRE.
   Mpi::Init(argc, argv);
   int num_procs = Mpi::WorldSize();
   int myid = Mpi::WorldRank();
   Hypre::Init();

   // 2. Parse command-line options.
   const char *mesh_file = "../../data/star.mesh";
   int order = 1;
   bool static_cond = false;
   bool pa = false;
   const char *device_config = "cpu";
   bool visualization = true;
   bool amgx_lib = true;
   bool amgx_mpi_teams = false;
   const char* amgx_json_file = ""; // JSON file for AmgX
   int ndevices = 1;

   OptionsParser args(argc, argv);
   args.AddOption(&mesh_file, "-m", "--mesh",
                  "Mesh file to use.");
   args.AddOption(&order, "-o", "--order",
                  "Finite element order (polynomial degree) or -1 for"
                  " isoparametric space.");
   args.AddOption(&static_cond, "-sc", "--static-condensation", "-no-sc",
                  "--no-static-condensation", "Enable static condensation.");
   args.AddOption(&pa, "-pa", "--partial-assembly", "-no-pa",
                  "--no-partial-assembly", "Enable Partial Assembly.");
   args.AddOption(&amgx_lib, "-amgx", "--amgx-lib", "-no-amgx",
                  "--no-amgx-lib", "Use AmgX in example.");
   args.AddOption(&amgx_json_file, "--amgx-file", "--amgx-file",
                  "AMGX solver config file (overrides --amgx-solver, --amgx-verbose)");
   args.AddOption(&amgx_mpi_teams, "--amgx-mpi-teams", "--amgx-mpi-teams",
                  "--amgx-mpi-gpu-exclusive", "--amgx-mpi-gpu-exclusive",
                  "Create MPI teams when using AmgX to load balance between ranks and GPUs.");
   args.AddOption(&device_config, "-d", "--device",
                  "Device configuration string, see Device::Configure().");
   args.AddOption(&visualization, "-vis", "--visualization", "-no-vis",
                  "--no-visualization",
                  "Enable or disable GLVis visualization.");
   args.AddOption(&ndevices, "-nd", "--gpus-per-node-in-teams-mode",
                  "Number of GPU devices per node (Only used if amgx_mpi_teams is true).");

   args.Parse();
   if (!args.Good())
   {
      if (myid == 0)
      {
         args.PrintUsage(cout);
      }
      return 1;
   }
   if (myid == 0)
   {
      args.PrintOptions(cout);
   }

   // 3. Enable hardware devices such as GPUs, and programming models such as
   //    CUDA, OCCA, RAJA and OpenMP based on command line options.
   Device device(device_config);
   if (myid == 0) { device.Print(); }

   // 4. Read the (serial) mesh from the given mesh file on all processors. We
   //    can handle triangular, quadrilateral, tetrahedral, hexahedral, surface
   //    and volume meshes with the same code.
   Mesh mesh(mesh_file, 1, 1);
   int dim = mesh.Dimension();

   // 5. Refine the serial mesh on all processors to increase the resolution. In
   //    this example we do 'ref_levels' of uniform refinement. We choose
   //    'ref_levels' to be the largest number that gives a final mesh with no
   //    more than 10,000 elements.
   {
      int ref_levels =
         (int)floor(log(10000./mesh.GetNE())/log(2.)/dim);
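      // Illustration of the formula above (independent of the actual mesh
      // file): a 2D mesh with 20 elements gives
      // ref_levels = floor(log(500)/log(2)/2) = floor(4.48) = 4, and four
      // uniform refinements then yield 20 * 4^4 = 5120 <= 10,000 elements.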
      for (int l = 0; l < ref_levels; l++)
      {
         mesh.UniformRefinement();
      }
   }

   // 6. Define a parallel mesh by a partitioning of the serial mesh. Refine
   //    this mesh further in parallel to increase the resolution. Once the
   //    parallel mesh is defined, the serial mesh can be deleted.
   ParMesh pmesh(MPI_COMM_WORLD, mesh);
   mesh.Clear();
   {
      int par_ref_levels = 2;
      for (int l = 0; l < par_ref_levels; l++)
      {
         pmesh.UniformRefinement();
      }
   }

   // 7. Define a parallel finite element space on the parallel mesh. Here we
   //    use continuous Lagrange finite elements of the specified order. If
   //    order < 1, we instead use an isoparametric/isogeometric space.
   FiniteElementCollection *fec;
   bool delete_fec;
   if (order > 0)
   {
      fec = new H1_FECollection(order, dim);
      delete_fec = true;
   }
   else if (pmesh.GetNodes())
   {
      fec = pmesh.GetNodes()->OwnFEC();
      delete_fec = false;
      if (myid == 0)
      {
         cout << "Using isoparametric FEs: " << fec->Name() << endl;
      }
   }
   else
   {
      fec = new H1_FECollection(order = 1, dim);
      delete_fec = true;
   }
   ParFiniteElementSpace fespace(&pmesh, fec);
   HYPRE_BigInt size = fespace.GlobalTrueVSize();
   if (myid == 0)
   {
      cout << "Number of finite element unknowns: " << size << endl;
   }

   // 8. Determine the list of true (i.e. parallel conforming) essential
   //    boundary dofs. In this example, the boundary conditions are defined
   //    by marking all the boundary attributes from the mesh as essential
   //    (Dirichlet) and converting them to a list of true dofs.
   Array<int> ess_tdof_list;
   if (pmesh.bdr_attributes.Size())
   {
      Array<int> ess_bdr(pmesh.bdr_attributes.Max());
      ess_bdr = 1;
      fespace.GetEssentialTrueDofs(ess_bdr, ess_tdof_list);
   }

   // 9. Set up the parallel linear form b(.) which corresponds to the
   //    right-hand side of the FEM linear system, which in this case is
   //    (1,phi_i) where phi_i are the basis functions in fespace.
   ParLinearForm b(&fespace);
   ConstantCoefficient one(1.0);
   b.AddDomainIntegrator(new DomainLFIntegrator(one));
   b.Assemble();

   // 10. Define the solution vector x as a parallel finite element grid function
   //     corresponding to fespace. Initialize x with initial guess of zero,
   //     which satisfies the boundary conditions.
   ParGridFunction x(&fespace);
   x = 0.0;

   // 11. Set up the parallel bilinear form a(.,.) on the finite element space
   //     corresponding to the Laplacian operator -Delta, by adding the Diffusion
   //     domain integrator.
   ParBilinearForm a(&fespace);
   if (pa) { a.SetAssemblyLevel(AssemblyLevel::PARTIAL); }
   a.AddDomainIntegrator(new DiffusionIntegrator(one));

   // 12. Assemble the parallel bilinear form and the corresponding linear
   //     system, applying any necessary transformations such as: parallel
   //     assembly, eliminating boundary conditions, applying conforming
   //     constraints for non-conforming AMR, static condensation, etc.
   if (static_cond) { a.EnableStaticCondensation(); }
   a.Assemble();

   OperatorPtr A;
   Vector B, X;
   a.FormLinearSystem(ess_tdof_list, x, b, A, X, B);

   // 13. Solve the linear system A X = B.
   //     * With full assembly, use the BoomerAMG preconditioner from hypre.
   //     * If AmgX is available, solve using the AmgX AMG preconditioner.
   //     * With partial assembly, use Jacobi smoothing, for now.
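   //     (The branches below are selected by the options parsed in step 2:
   //     -pa takes the Jacobi/CG path, --amgx-file switches AmgX from
   //     preconditioner mode to solver mode, and -no-amgx falls back to
   //     BoomerAMG.)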
   Solver *prec = NULL;
   if (pa)
   {
      if (UsesTensorBasis(fespace))
      {
         prec = new OperatorJacobiSmoother(a, ess_tdof_list);
      }

      CGSolver cg(MPI_COMM_WORLD);
      cg.SetRelTol(1e-12);
      cg.SetMaxIter(2000);
      cg.SetPrintLevel(1);
      if (prec) { cg.SetPreconditioner(*prec); }
      cg.SetOperator(*A);
      cg.Mult(B, X);
      delete prec;
   }
   else if (amgx_lib && strcmp(amgx_json_file,"") == 0)
   {
      MFEM_VERIFY(!amgx_mpi_teams,
                  "Please add JSON file to try AmgX with MPI teams mode");

      bool amgx_verbose = false;
      prec = new AmgXSolver(MPI_COMM_WORLD, AmgXSolver::PRECONDITIONER,
                            amgx_verbose);

      CGSolver cg(MPI_COMM_WORLD);
      cg.SetRelTol(1e-12);
      cg.SetMaxIter(2000);
      cg.SetPrintLevel(1);
      if (prec) { cg.SetPreconditioner(*prec); }
      cg.SetOperator(*A);
      cg.Mult(B, X);
      delete prec;

   }
   else if (amgx_lib && strcmp(amgx_json_file,"") != 0)
   {
      AmgXSolver amgx;
      amgx.ReadParameters(amgx_json_file, AmgXSolver::EXTERNAL);

      if (amgx_mpi_teams)
      {
         // Forms MPI teams to load balance between MPI ranks and GPUs
         amgx.InitMPITeams(MPI_COMM_WORLD, ndevices);
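         // For example, an illustrative teams-mode run (matching the sample
         // runs above, with an assumed 2 GPUs per node) would be:
         //   mpirun -np 10 ex1p --amgx-file amg_pcg.json --amgx-mpi-teams -nd 2
         // Ranks on the same node are grouped into one team per GPU so that
         // their data can be consolidated on that device.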
      }
      else
      {
         // Assumes each MPI rank is paired with a GPU
         amgx.InitExclusiveGPU(MPI_COMM_WORLD);
      }

      amgx.SetOperator(*A.As<HypreParMatrix>());
      amgx.SetConvergenceCheck(true);
      amgx.Mult(B, X);

      // Release MPI communicators and resources created by AmgX
      amgx.Finalize();
   }
   else
   {
      prec = new HypreBoomerAMG;

      CGSolver cg(MPI_COMM_WORLD);
      cg.SetRelTol(1e-12);
      cg.SetMaxIter(2000);
      cg.SetPrintLevel(1);
      if (prec) { cg.SetPreconditioner(*prec); }
      cg.SetOperator(*A);
      cg.Mult(B, X);
      delete prec;
   }

   // 14. Recover the parallel grid function corresponding to X. This is the
   //     local finite element solution on each processor.
   a.RecoverFEMSolution(X, b, x);

   // 15. Save the refined mesh and the solution in parallel. This output can
   //     be viewed later using GLVis: "glvis -np <np> -m mesh -g sol".
   {
      ostringstream mesh_name, sol_name;
      mesh_name << "mesh." << setfill('0') << setw(6) << myid;
      sol_name << "sol." << setfill('0') << setw(6) << myid;

      ofstream mesh_ofs(mesh_name.str().c_str());
      mesh_ofs.precision(8);
      pmesh.Print(mesh_ofs);

      ofstream sol_ofs(sol_name.str().c_str());
      sol_ofs.precision(8);
      x.Save(sol_ofs);
   }

   // 16. Send the solution by socket to a GLVis server.
   if (visualization)
   {
      char vishost[] = "localhost";
      int visport = 19916;
      socketstream sol_sock(vishost, visport);
      sol_sock << "parallel " << num_procs << " " << myid << "\n";
      sol_sock.precision(8);
      sol_sock << "solution\n" << pmesh << x << flush;
   }

   // 17. Free the used memory.
   if (delete_fec)
   {
      delete fec;
   }

   return 0;
}