//                                MFEM Example 5
//
// Compile with: make ex5
//
// Sample runs:  ex5 -m ../data/square-disc.mesh
//               ex5 -m ../data/star.mesh
//               ex5 -m ../data/star.mesh -pa
//               ex5 -m ../data/beam-tet.mesh
//               ex5 -m ../data/beam-hex.mesh
//               ex5 -m ../data/beam-hex.mesh -pa
//               ex5 -m ../data/escher.mesh
//               ex5 -m ../data/fichera.mesh
//
// Device sample runs:
//               ex5 -m ../data/star.mesh -pa -d cuda
//               ex5 -m ../data/star.mesh -pa -d raja-cuda
//               ex5 -m ../data/star.mesh -pa -d raja-omp
//               ex5 -m ../data/beam-hex.mesh -pa -d cuda
//
// Description:  This example code solves a simple 2D/3D mixed Darcy problem
//               corresponding to the saddle point system
//
//                                 k*u + grad p = f
//                                 - div u      = g
//
//               with natural boundary condition -p = <given pressure>.
//               Here, we use a given exact solution (u,p) and compute the
//               corresponding r.h.s. (f,g).  We discretize with Raviart-Thomas
//               finite elements (velocity u) and piecewise discontinuous
//               polynomials (pressure p).
//
//               The example demonstrates the use of the BlockOperator class, as
//               well as the collective saving of several grid functions in
//               VisIt (visit.llnl.gov) and ParaView (paraview.org) formats.
//
//               We recommend viewing examples 1-4 before viewing this example.
#include "mfem.hpp"

#include <algorithm>
#include <cmath>
#include <fstream>
#include <iostream>

using namespace std;
using namespace mfem;
46// Define the analytical solution and forcing terms / boundary conditions
47void uFun_ex(const Vector & x, Vector & u);
48real_t pFun_ex(const Vector & x);
49void fFun(const Vector & x, Vector & f);
50real_t gFun(const Vector & x);
51real_t f_natural(const Vector & x);
53int main(int argc, char *argv[])
55 StopWatch chrono;
57 // 1. Parse command-line options.
58 const char *mesh_file = "../data/star.mesh";
59 int order = 1;
60 bool pa = false;
61 const char *device_config = "cpu";
62 bool visualization = 1;
64 OptionsParser args(argc, argv);
65 args.AddOption(&mesh_file, "-m", "--mesh",
66 "Mesh file to use.");
67 args.AddOption(&order, "-o", "--order",
68 "Finite element order (polynomial degree).");
69 args.AddOption(&pa, "-pa", "--partial-assembly", "-no-pa",
70 "--no-partial-assembly", "Enable Partial Assembly.");
71 args.AddOption(&device_config, "-d", "--device",
72 "Device configuration string, see Device::Configure().");
73 args.AddOption(&visualization, "-vis", "--visualization", "-no-vis",
74 "--no-visualization",
75 "Enable or disable GLVis visualization.");
76 args.Parse();
77 if (!args.Good())
78 {
79 args.PrintUsage(cout);
80 return 1;
81 }
82 args.PrintOptions(cout);
84 // 2. Enable hardware devices such as GPUs, and programming models such as
85 // CUDA, OCCA, RAJA and OpenMP based on command line options.
86 Device device(device_config);
87 device.Print();
89 // 3. Read the mesh from the given mesh file. We can handle triangular,
90 // quadrilateral, tetrahedral, hexahedral, surface and volume meshes with
91 // the same code.
92 Mesh *mesh = new Mesh(mesh_file, 1, 1);
93 int dim = mesh->Dimension();
95 // 4. Refine the mesh to increase the resolution. In this example we do
96 // 'ref_levels' of uniform refinement. We choose 'ref_levels' to be the
97 // largest number that gives a final mesh with no more than 10,000
98 // elements.
99 {
100 int ref_levels =
101 (int)floor(log(10000./mesh->GetNE())/log(2.)/dim);
102 for (int l = 0; l < ref_levels; l++)
103 {
104 mesh->UniformRefinement();
105 }
106 }
108 // 5. Define a finite element space on the mesh. Here we use the
109 // Raviart-Thomas finite elements of the specified order.
110 FiniteElementCollection *hdiv_coll(new RT_FECollection(order, dim));
111 FiniteElementCollection *l2_coll(new L2_FECollection(order, dim));
113 FiniteElementSpace *R_space = new FiniteElementSpace(mesh, hdiv_coll);
114 FiniteElementSpace *W_space = new FiniteElementSpace(mesh, l2_coll);
116 // 6. Define the BlockStructure of the problem, i.e. define the array of
117 // offsets for each variable. The last component of the Array is the sum
118 // of the dimensions of each block.
119 Array<int> block_offsets(3); // number of variables + 1
120 block_offsets[0] = 0;
121 block_offsets[1] = R_space->GetVSize();
122 block_offsets[2] = W_space->GetVSize();
123 block_offsets.PartialSum();
125 std::cout << "***********************************************************\n";
126 std::cout << "dim(R) = " << block_offsets[1] - block_offsets[0] << "\n";
127 std::cout << "dim(W) = " << block_offsets[2] - block_offsets[1] << "\n";
128 std::cout << "dim(R+W) = " << block_offsets.Last() << "\n";
129 std::cout << "***********************************************************\n";
131 // 7. Define the coefficients, analytical solution, and rhs of the PDE.
132 ConstantCoefficient k(1.0);
141 // 8. Allocate memory (x, rhs) for the analytical solution and the right hand
142 // side. Define the GridFunction u,p for the finite element solution and
143 // linear forms fform and gform for the right hand side. The data
144 // allocated by x and rhs are passed as a reference to the grid functions
145 // (u,p) and the linear forms (fform, gform).
146 MemoryType mt = device.GetMemoryType();
147 BlockVector x(block_offsets, mt), rhs(block_offsets, mt);
149 LinearForm *fform(new LinearForm);
150 fform->Update(R_space, rhs.GetBlock(0), 0);
153 fform->Assemble();
154 fform->SyncAliasMemory(rhs);
156 LinearForm *gform(new LinearForm);
157 gform->Update(W_space, rhs.GetBlock(1), 0);
158 gform->AddDomainIntegrator(new DomainLFIntegrator(gcoeff));
159 gform->Assemble();
160 gform->SyncAliasMemory(rhs);
162 // 9. Assemble the finite element matrices for the Darcy operator
163 //
164 // D = [ M B^T ]
165 // [ B 0 ]
166 // where:
167 //
168 // M = \int_\Omega k u_h \cdot v_h d\Omega u_h, v_h \in R_h
169 // B = -\int_\Omega \div u_h q_h d\Omega u_h \in R_h, q_h \in W_h
170 BilinearForm *mVarf(new BilinearForm(R_space));
171 MixedBilinearForm *bVarf(new MixedBilinearForm(R_space, W_space));
173 if (pa) { mVarf->SetAssemblyLevel(AssemblyLevel::PARTIAL); }
175 mVarf->Assemble();
176 if (!pa) { mVarf->Finalize(); }
178 if (pa) { bVarf->SetAssemblyLevel(AssemblyLevel::PARTIAL); }
180 bVarf->Assemble();
181 if (!pa) { bVarf->Finalize(); }
183 BlockOperator darcyOp(block_offsets);
185 TransposeOperator *Bt = NULL;
187 if (pa)
188 {
189 Bt = new TransposeOperator(bVarf);
191 darcyOp.SetBlock(0,0, mVarf);
192 darcyOp.SetBlock(0,1, Bt, -1.0);
193 darcyOp.SetBlock(1,0, bVarf, -1.0);
194 }
195 else
196 {
197 SparseMatrix &M(mVarf->SpMat());
198 SparseMatrix &B(bVarf->SpMat());
199 B *= -1.;
200 Bt = new TransposeOperator(&B);
202 darcyOp.SetBlock(0,0, &M);
203 darcyOp.SetBlock(0,1, Bt);
204 darcyOp.SetBlock(1,0, &B);
205 }
207 // 10. Construct the operators for preconditioner
208 //
209 // P = [ diag(M) 0 ]
210 // [ 0 B diag(M)^-1 B^T ]
211 //
212 // Here we use Symmetric Gauss-Seidel to approximate the inverse of the
213 // pressure Schur Complement
214 SparseMatrix *MinvBt = NULL;
215 Vector Md(mVarf->Height());
217 BlockDiagonalPreconditioner darcyPrec(block_offsets);
218 Solver *invM, *invS;
219 SparseMatrix *S = NULL;
221 if (pa)
222 {
223 mVarf->AssembleDiagonal(Md);
224 auto Md_host = Md.HostRead();
225 Vector invMd(mVarf->Height());
226 for (int i=0; i<mVarf->Height(); ++i)
227 {
228 invMd(i) = 1.0 / Md_host[i];
229 }
231 Vector BMBt_diag(bVarf->Height());
232 bVarf->AssembleDiagonal_ADAt(invMd, BMBt_diag);
234 Array<int> ess_tdof_list; // empty
236 invM = new OperatorJacobiSmoother(Md, ess_tdof_list);
237 invS = new OperatorJacobiSmoother(BMBt_diag, ess_tdof_list);
238 }
239 else
240 {
241 SparseMatrix &M(mVarf->SpMat());
242 M.GetDiag(Md);
243 Md.HostReadWrite();
245 SparseMatrix &B(bVarf->SpMat());
246 MinvBt = Transpose(B);
248 for (int i = 0; i < Md.Size(); i++)
249 {
250 MinvBt->ScaleRow(i, 1./Md(i));
251 }
253 S = Mult(B, *MinvBt);
255 invM = new DSmoother(M);
258 invS = new GSSmoother(*S);
260 invS = new UMFPackSolver(*S);
262 }
264 invM->iterative_mode = false;
265 invS->iterative_mode = false;
267 darcyPrec.SetDiagonalBlock(0, invM);
268 darcyPrec.SetDiagonalBlock(1, invS);
270 // 11. Solve the linear system with MINRES.
271 // Check the norm of the unpreconditioned residual.
272 int maxIter(1000);
273 real_t rtol(1.e-6);
274 real_t atol(1.e-10);
276 chrono.Clear();
277 chrono.Start();
278 MINRESSolver solver;
279 solver.SetAbsTol(atol);
280 solver.SetRelTol(rtol);
281 solver.SetMaxIter(maxIter);
282 solver.SetOperator(darcyOp);
283 solver.SetPreconditioner(darcyPrec);
284 solver.SetPrintLevel(1);
285 x = 0.0;
286 solver.Mult(rhs, x);
287 if (device.IsEnabled()) { x.HostRead(); }
288 chrono.Stop();
290 if (solver.GetConverged())
291 {
292 std::cout << "MINRES converged in " << solver.GetNumIterations()
293 << " iterations with a residual norm of "
294 << solver.GetFinalNorm() << ".\n";
295 }
296 else
297 {
298 std::cout << "MINRES did not converge in " << solver.GetNumIterations()
299 << " iterations. Residual norm is " << solver.GetFinalNorm()
300 << ".\n";
301 }
302 std::cout << "MINRES solver took " << chrono.RealTime() << "s.\n";
304 // 12. Create the grid functions u and p. Compute the L2 error norms.
306 u.MakeRef(R_space, x.GetBlock(0), 0);
307 p.MakeRef(W_space, x.GetBlock(1), 0);
309 int order_quad = max(2, 2*order+1);
311 for (int i=0; i < Geometry::NumGeom; ++i)
312 {
313 irs[i] = &(IntRules.Get(i, order_quad));
314 }
316 real_t err_u = u.ComputeL2Error(ucoeff, irs);
317 real_t norm_u = ComputeLpNorm(2., ucoeff, *mesh, irs);
318 real_t err_p = p.ComputeL2Error(pcoeff, irs);
319 real_t norm_p = ComputeLpNorm(2., pcoeff, *mesh, irs);
321 std::cout << "|| u_h - u_ex || / || u_ex || = " << err_u / norm_u << "\n";
322 std::cout << "|| p_h - p_ex || / || p_ex || = " << err_p / norm_p << "\n";
324 // 13. Save the mesh and the solution. This output can be viewed later using
325 // GLVis: "glvis -m ex5.mesh -g" or "glvis -m ex5.mesh -g
326 //".
327 {
328 ofstream mesh_ofs("ex5.mesh");
329 mesh_ofs.precision(8);
330 mesh->Print(mesh_ofs);
332 ofstream u_ofs("");
333 u_ofs.precision(8);
334 u.Save(u_ofs);
336 ofstream p_ofs("");
337 p_ofs.precision(8);
338 p.Save(p_ofs);
339 }
341 // 14. Save data in the VisIt format
342 VisItDataCollection visit_dc("Example5", mesh);
343 visit_dc.RegisterField("velocity", &u);
344 visit_dc.RegisterField("pressure", &p);
345 visit_dc.Save();
347 // 15. Save data in the ParaView format
348 ParaViewDataCollection paraview_dc("Example5", mesh);
349 paraview_dc.SetPrefixPath("ParaView");
350 paraview_dc.SetLevelsOfDetail(order);
351 paraview_dc.SetCycle(0);
352 paraview_dc.SetDataFormat(VTKFormat::BINARY);
353 paraview_dc.SetHighOrderOutput(true);
354 paraview_dc.SetTime(0.0); // set the time
355 paraview_dc.RegisterField("velocity",&u);
356 paraview_dc.RegisterField("pressure",&p);
357 paraview_dc.Save();
359 // 16. Send the solution by socket to a GLVis server.
360 if (visualization)
361 {
362 char vishost[] = "localhost";
363 int visport = 19916;
365 u_sock.precision(8);
366 u_sock << "solution\n" << *mesh << u << "window_title 'Velocity'" << endl;
368 p_sock.precision(8);
369 p_sock << "solution\n" << *mesh << p << "window_title 'Pressure'" << endl;
370 }
372 // 17. Free the used memory.
373 delete fform;
374 delete gform;
375 delete invM;
376 delete invS;
377 delete S;
378 delete Bt;
379 delete MinvBt;
380 delete mVarf;
381 delete bVarf;
382 delete W_space;
383 delete R_space;
384 delete l2_coll;
385 delete hdiv_coll;
386 delete mesh;
388 return 0;
392void uFun_ex(const Vector & x, Vector & u)
394 real_t xi(x(0));
395 real_t yi(x(1));
396 real_t zi(0.0);
397 if (x.Size() == 3)
398 {
399 zi = x(2);
400 }
402 u(0) = - exp(xi)*sin(yi)*cos(zi);
403 u(1) = - exp(xi)*cos(yi)*cos(zi);
405 if (x.Size() == 3)
406 {
407 u(2) = exp(xi)*sin(yi)*sin(zi);
408 }
411// Change if needed
414 real_t xi(x(0));
415 real_t yi(x(1));
416 real_t zi(0.0);
418 if (x.Size() == 3)
419 {
420 zi = x(2);
421 }
423 return exp(xi)*sin(yi)*cos(zi);
426void fFun(const Vector & x, Vector & f)
428 f = 0.0;
433 if (x.Size() == 3)
434 {
435 return -pFun_ex(x);
436 }
437 else
438 {
439 return 0;
440 }
445 return (-pFun_ex(x));
