4.0/device_8cpp_source.html

 // Copyright (c) 2010, Lawrence Livermore National Security, LLC. Produced at

 // the Lawrence Livermore National Laboratory. LLNL-CODE-443211. All Rights

 // reserved. See file COPYRIGHT for details.

 //

 // This file is part of the MFEM library. For more information and source code

 // availability see http://mfem.org.

 //

 // MFEM is free software; you can redistribute it and/or modify it under the

 // terms of the GNU Lesser General Public License (as published by the Free

 // Software Foundation) version 2.1 dated February 1999.


 #include "forall.hpp"
 #include "cuda.hpp"
 #include "occa.hpp"

 #include <cstring>
 #include <map>
 #include <sstream>
 #include <string>


 namespace mfem

 {


 // Place the following variables in the mfem::internal namespace, so that they

 // will not be included in the doxygen documentation.

 // Holds the default OCCA device (only when MFEM_USE_OCCA is defined) and two
 // static lookup tables. The tables are parallel arrays: entry i of
 // backend_name is the textual name of entry i of backend_list, so both must
 // always be edited together and kept in the same order.
 namespace internal

 {


 #ifdef MFEM_USE_OCCA

 // Default occa::device used by MFEM.

 occa::device occaDevice;

 #endif


 // Backends listed by priority, high to low:

 // (indexed in lock-step with backend_name by Device::Configure and
 // Device::Print)
 static const Backend::Id backend_list[Backend::NUM_BACKENDS] =

 {

    Backend::OCCA_CUDA, Backend::RAJA_CUDA, Backend::CUDA,

    Backend::OCCA_OMP, Backend::RAJA_OMP, Backend::OMP,

    Backend::OCCA_CPU, Backend::RAJA_CPU, Backend::CPU

 };


 // Backend names listed by priority, high to low:

 // (these are the strings accepted in the comma-separated list given to
 // Device::Configure and the strings written by Device::Print)
 static const char *backend_name[Backend::NUM_BACKENDS] =

 {

    "occa-cuda", "raja-cuda", "cuda", "occa-omp", "raja-omp", "omp",

    "occa-cpu", "raja-cpu", "cpu"

 };


 } // namespace mfem::internal


 // Initialize the unique global Device variable.

 // NOTE(review): presumably this is the object returned by Device::Get(), on
 // which Configure(), Enable() and Setup() operate -- confirm in device.hpp.
 Device Device::device_singleton;


 // Destructor. Tears down the global memory manager 'mm', but only for the
 // object whose 'destroy_mm' flag is set (Configure() sets it on '*this').
 Device::~Device()
 {
    if (!destroy_mm) { return; }
    mm.Destroy();
 }


 // Configure the Device backends.
 //
 // device: comma-separated list of backend names, e.g. "cuda" or
 //         "raja-omp,occa-cpu". Every token must be one of the strings in
 //         internal::backend_name; otherwise MFEM_VERIFY fails with
 //         "invalid backend name". An empty token (empty string, doubled or
 //         trailing comma) is rejected the same way.
 // dev:    device id forwarded to Setup().
 //
 // The requested backends are marked on the object returned by Get(), which
 // is then set up and enabled; finally that state is copied into '*this' and
 // '*this' takes over the responsibility of destroying the memory manager.
 void Device::Configure(const std::string &device, const int dev)
 {
    // Lookup table: backend name -> backend id.
    std::map<std::string, Backend::Id> bmap;
    for (int i = 0; i < Backend::NUM_BACKENDS; i++)
    {
       bmap[internal::backend_name[i]] = internal::backend_list[i];
    }

    // Walk the comma-separated list; [beg,end) delimits the current token and
    // the last token ends at device.size().
    std::string::size_type beg = 0, end;
    while (1)
    {
       end = device.find(',', beg);
       end = (end != std::string::npos) ? end : device.size();
       const std::string bname = device.substr(beg, end - beg);
       std::map<std::string, Backend::Id>::iterator it = bmap.find(bname);
       MFEM_VERIFY(it != bmap.end(), "invalid backend name: '" << bname << '\'');
       Get().MarkBackend(it->second);
       if (end == device.size()) { break; }
       beg = end + 1; // skip the comma
    }

    // OCCA_CUDA needs CUDA or RAJA_CUDA:
    if (Allows(Backend::OCCA_CUDA) && !Allows(Backend::RAJA_CUDA))
    {
       Get().MarkBackend(Backend::CUDA);
    }

    // Perform setup.
    Get().Setup(dev);

    // Enable the device
    Enable();

    // Copy all data members from the global 'device_singleton' into '*this'.
    // std::memcpy has undefined behavior when the source and destination
    // overlap, so the copy is skipped when '*this' already is that object.
    if (this != &Get()) { std::memcpy(this, &Get(), sizeof(Device)); }

    // Only '*this' will call the MemoryManager::Destroy() method.
    destroy_mm = true;
 }


 // Print the configuration of the device: writes "Device configuration: "
 // followed by the comma-separated names of all backends whose bit is set in
 // 'backends' (in the priority order of internal::backend_list) and a newline.
 void Device::Print(std::ostream &out)
 {
    out << "Device configuration: ";
    int num_printed = 0;
    for (int k = 0; k < Backend::NUM_BACKENDS; k++)
    {
       // Skip the backends that are not part of the configuration.
       if (!(backends & internal::backend_list[k])) { continue; }
       // Separate every name but the first one from its predecessor.
       if (num_printed > 0) { out << ','; }
       out << internal::backend_name[k];
       num_printed++;
    }
    out << '\n';
 }


 // Select the memory type and memory class matching the allowed backends:
 // CUDA when any backend in Backend::CUDA_MASK is allowed, HOST otherwise.
 void Device::UpdateMemoryTypeAndClass()
 {
    const bool cuda_allowed = Device::Allows(Backend::CUDA_MASK);
    mem_type = cuda_allowed ? MemoryType::CUDA : MemoryType::HOST;
    mem_class = cuda_allowed ? MemoryClass::CUDA : MemoryClass::HOST;
 }


 void Device::Enable()

 {

    if (Get().backends & ~Backend::CPU)

    {

       Get().mode = Device::ACCELERATED;

       Get().UpdateMemoryTypeAndClass();

    }

 }


 #ifdef MFEM_USE_CUDA

 // Common CUDA initialization, compiled only when MFEM_USE_CUDA is defined.
 //
 // dev:  id passed to cudaSetDevice().
 // ngpu: output; receives the device count reported by cudaGetDeviceCount().
 //
 // Both CUDA runtime calls are wrapped in MFEM_CUDA_CHECK, and MFEM_VERIFY
 // fails with "No CUDA device found!" when the reported count is not positive.
 static void DeviceSetup(const int dev, int &ngpu)

 {

    MFEM_CUDA_CHECK(cudaGetDeviceCount(&ngpu));

    MFEM_VERIFY(ngpu > 0, "No CUDA device found!");

    // The device is selected only after the count has been verified.
    MFEM_CUDA_CHECK(cudaSetDevice(dev));

 }

 #endif


 // Setup for the CUDA backend: forwards to DeviceSetup() when MFEM_USE_CUDA is
 // defined. Without MFEM_USE_CUDA the body is empty and 'ngpu' is left
 // untouched.
 static void CudaDeviceSetup(const int dev, int &ngpu)

 {

 #ifdef MFEM_USE_CUDA

    DeviceSetup(dev, ngpu);

 #endif

 }


 // Setup for the RAJA CUDA backend. When MFEM_USE_CUDA is defined, runs
 // DeviceSetup() unless 'ngpu' is already positive, i.e. unless an earlier
 // setup call has already recorded a device count. Without MFEM_USE_CUDA this
 // is a no-op.
 static void RajaDeviceSetup(const int dev, int &ngpu)
 {
 #ifdef MFEM_USE_CUDA
    if (ngpu > 0) { return; }
    DeviceSetup(dev, ngpu);
 #endif
 }


 // Setup for the OCCA backends.
 //
 // dev: device id placed in the OCCA properties string of the CUDA mode.
 //
 // With MFEM_USE_OCCA defined: verifies that at most one of the OCCA backends
 // (cpu, omp, cuda) is allowed, sets up internal::occaDevice in the matching
 // mode (Serial when neither cuda nor omp is selected), then registers the
 // MFEM kernel directory with OCCA under the library name "mfem" and loads the
 // kernels. Aborts when the selected mode is not enabled in the OCCA build or
 // when no kernel directory can be found.
 // Without MFEM_USE_OCCA: always aborts.
 static void OccaDeviceSetup(const int dev)
 {
 #ifdef MFEM_USE_OCCA
    const int cpu  = Device::Allows(Backend::OCCA_CPU);
    const int omp  = Device::Allows(Backend::OCCA_OMP);
    const int cuda = Device::Allows(Backend::OCCA_CUDA);
    if (cpu + omp + cuda > 1)
    {
       MFEM_ABORT("Only one OCCA backend can be configured at a time!");
    }
    if (cuda)
    {
 #if OCCA_CUDA_ENABLED
       // Format the id as a decimal number. Appending the single character
       // '0'+dev is only correct for ids 0..9 and yields a non-digit
       // character for any id of 10 or more.
       std::ostringstream mode;
       mode << "mode: 'CUDA', device_id : " << dev;
       internal::occaDevice.setup(mode.str());
 #else
       MFEM_ABORT("the OCCA CUDA backend requires OCCA built with CUDA!");
 #endif
    }
    else if (omp)
    {
 #if OCCA_OPENMP_ENABLED
       internal::occaDevice.setup("mode: 'OpenMP'");
 #else
       MFEM_ABORT("the OCCA OpenMP backend requires OCCA built with OpenMP!");
 #endif
    }
    else
    {
       internal::occaDevice.setup("mode: 'Serial'");
    }

    // Locate the kernels: the installed headers take precedence over the
    // source tree.
    std::string mfemDir;
    if (occa::io::exists(MFEM_INSTALL_DIR "/include/mfem/"))
    {
       mfemDir = MFEM_INSTALL_DIR "/include/mfem/";
    }
    else if (occa::io::exists(MFEM_SOURCE_DIR))
    {
       mfemDir = MFEM_SOURCE_DIR;
    }
    else
    {
       MFEM_ABORT("Cannot find OCCA kernels in MFEM_INSTALL_DIR or MFEM_SOURCE_DIR");
    }

    occa::io::addLibraryPath("mfem", mfemDir);
    occa::loadKernels("mfem");
 #else
    MFEM_ABORT("the OCCA backends require MFEM built with MFEM_USE_OCCA=YES");
 #endif
 }


 // One-time setup of the configured backends.
 //
 // device: device id stored in 'dev' and forwarded to the backend-specific
 //         setup functions.
 //
 // Fails (MFEM_VERIFY) when 'ngpu' is not -1, which is reported as the Device
 // being already configured, or when a backend is allowed whose build option
 // (MFEM_USE_CUDA, MFEM_USE_RAJA, MFEM_USE_OPENMP) was not enabled at compile
 // time.
 void Device::Setup(const int device)

 {

    MFEM_VERIFY(ngpu == -1, "the mfem::Device is already configured!");


    // From here on 'ngpu' is no longer -1, so a second call fails the check
    // above.
    ngpu = 0;

    dev = device;


    // Each check below is compiled in only when the corresponding feature is
    // missing from the build.
 #ifndef MFEM_USE_CUDA

    MFEM_VERIFY(!Allows(Backend::CUDA_MASK),

                "the CUDA backends require MFEM built with MFEM_USE_CUDA=YES");

 #endif

 #ifndef MFEM_USE_RAJA

    MFEM_VERIFY(!Allows(Backend::RAJA_MASK),

                "the RAJA backends require MFEM built with MFEM_USE_RAJA=YES");

 #endif

 #ifndef MFEM_USE_OPENMP

    MFEM_VERIFY(!Allows(Backend::OMP|Backend::RAJA_OMP),

                "the OpenMP and RAJA OpenMP backends require MFEM built with"

                " MFEM_USE_OPENMP=YES");

 #endif

    // CUDA runs first: RajaDeviceSetup() skips its own initialization when
    // 'ngpu' has already been set to a positive value.
    if (Allows(Backend::CUDA)) { CudaDeviceSetup(dev, ngpu); }

    if (Allows(Backend::RAJA_CUDA)) { RajaDeviceSetup(dev, ngpu); }

    // The check for MFEM_USE_OCCA is in the function OccaDeviceSetup().

    if (Allows(Backend::OCCA_MASK)) { OccaDeviceSetup(dev); }

 }


 } // mfem

mfem::Backend::OMP
[host] OpenMP backend. Enabled when MFEM_USE_OPENMP = YES.
Definition: device.hpp:35

mfem::Device::~Device
~Device()
Destructor.
Definition: device.cpp:54

mfem::MemoryClass::CUDA
Memory types: { CUDA, CUDA_UVM }.

mfem::Device::Print
void Print(std::ostream &out=mfem::out)
Print the configuration of the MFEM virtual device object.
Definition: device.cpp:98

mfem::Device::Configure
void Configure(const std::string &device, const int dev=0)
Configure the Device backends.
Definition: device.cpp:59

mfem::Backend::OCCA_CUDA
[device] OCCA CUDA backend. Enabled when MFEM_USE_OCCA = YES and MFEM_USE_CUDA = YES.
Definition: device.hpp:54

mfem::Backend::RAJA_CPU
[host] RAJA CPU backend: sequential execution on each MPI rank. Enabled when MFEM_USE_RAJA = YES...
Definition: device.hpp:40

occa.hpp

mfem::Backend::RAJA_OMP
[host] RAJA OpenMP backend. Enabled when MFEM_USE_RAJA = YES and MFEM_USE_OPENMP = YES...
Definition: device.hpp:43

mfem::Backend::NUM_BACKENDS
Number of backends: from (1 << 0) to (1 << (NUM_BACKENDS-1)).
Definition: device.hpp:62

mfem::MemoryManager::Destroy
void Destroy()
Definition: mem_manager.cpp:108

mfem::Backend::OCCA_OMP
[host] OCCA OpenMP backend. Enabled when MFEM_USE_OCCA = YES.
Definition: device.hpp:51

mfem::Backend::CPU
[host] Default CPU backend: sequential execution on each MPI rank.
Definition: device.hpp:33

mfem::Backend::CUDA_MASK
Bitwise-OR of all CUDA backends.
Definition: device.hpp:67

cuda.hpp

mfem::MemoryType::CUDA
cudaMalloc, cudaFree

mfem::Device::Allows
static bool Allows(unsigned long b_mask)
Return true if any of the backends in the backend mask, b_mask, are allowed.
Definition: device.hpp:204

mfem::mm
MemoryManager mm
The (single) global memory manager object.
Definition: mem_manager.cpp:709

mfem::MemoryType::HOST
Host memory; using new[] and delete[].

mfem::Backend::OCCA_MASK
Bitwise-OR of all OCCA backends.
Definition: device.hpp:76

mfem::Backend::Id
Id
In the documentation below, we use square brackets to indicate the type of the backend: host or devic...
Definition: device.hpp:30

mfem::Backend::RAJA_MASK
Bitwise-OR of all RAJA backends.
Definition: device.hpp:74

mfem::out
OutStream out(std::cout)
Global stream used by the library for standard output. Initially it uses the same std::streambuf as s...
Definition: globals.hpp:64

mfem::Device
The MFEM Device class abstracts hardware devices such as GPUs, as well as programming models such as ...
Definition: device.hpp:96

mfem::Backend::RAJA_CUDA
[device] RAJA CUDA backend. Enabled when MFEM_USE_RAJA = YES and MFEM_USE_CUDA = YES.
Definition: device.hpp:46

forall.hpp

mfem::Backend::OCCA_CPU
[host] OCCA CPU backend: sequential execution on each MPI rank. Enabled when MFEM_USE_OCCA = YES...
Definition: device.hpp:49

mfem::Backend::CUDA
[device] CUDA backend. Enabled when MFEM_USE_CUDA = YES.
Definition: device.hpp:37