4.9/device_8hpp_source.html

// Copyright (c) 2010-2025, Lawrence Livermore National Security, LLC. Produced

// at the Lawrence Livermore National Laboratory. All Rights reserved. See files

// LICENSE and NOTICE for details. LLNL-CODE-806117.

//

// This file is part of the MFEM library. For more information and source code

// availability visit https://mfem.org.

//

// MFEM is free software; you can redistribute it and/or modify it under the

// terms of the BSD-3 license. We welcome feedback and contributions, see file

// CONTRIBUTING.md for details.


#ifndef MFEM_DEVICE_HPP

#define MFEM_DEVICE_HPP


#include "enzyme.hpp"

#include "globals.hpp"

#include "mem_manager.hpp"


#include <string>


namespace mfem

{


/// MFEM backends.
/** In general, a backend implements just a subset of the kernels provided by
    the default CPU backend. Backends are meant to accelerate the data-parallel
    portions of the code; they can use a device memory space (e.g. GPUs) or
    share the memory space of the host (OpenMP). */
struct Backend
{
   /** @brief In the documentation below, square brackets indicate the type of
       the backend: host or device. */
   /** Every identifier below is a distinct single bit, so identifiers can be
       combined with bitwise-OR into masks. */
   enum Id: unsigned long
   {
      /// [host] Default CPU backend: sequential execution on each MPI rank.
      CPU = 1UL << 0,
      /// [host] OpenMP backend. Enabled when MFEM_USE_OPENMP = YES.
      OMP = 1UL << 1,
      /// [device] CUDA backend. Enabled when MFEM_USE_CUDA = YES.
      CUDA = 1UL << 2,
      /// [device] HIP backend. Enabled when MFEM_USE_HIP = YES.
      HIP = 1UL << 3,
      /** @brief [host] RAJA CPU backend: sequential execution on each MPI
          rank. Enabled when MFEM_USE_RAJA = YES. */
      RAJA_CPU = 1UL << 4,
      /** @brief [host] RAJA OpenMP backend. Enabled when MFEM_USE_RAJA = YES
          and MFEM_USE_OPENMP = YES. */
      RAJA_OMP = 1UL << 5,
      /** @brief [device] RAJA CUDA backend. Enabled when MFEM_USE_RAJA = YES
          and MFEM_USE_CUDA = YES. */
      RAJA_CUDA = 1UL << 6,
      /** @brief [device] RAJA HIP backend. Enabled when MFEM_USE_RAJA = YES
          and MFEM_USE_HIP = YES. */
      RAJA_HIP = 1UL << 7,
      /** @brief [host] OCCA CPU backend: sequential execution on each MPI
          rank. Enabled when MFEM_USE_OCCA = YES. */
      OCCA_CPU = 1UL << 8,
      /// [host] OCCA OpenMP backend. Enabled when MFEM_USE_OCCA = YES.
      OCCA_OMP = 1UL << 9,
      /** @brief [device] OCCA CUDA backend. Enabled when MFEM_USE_OCCA = YES
          and MFEM_USE_CUDA = YES. */
      OCCA_CUDA = 1UL << 10,
      /** @brief [host] CEED CPU backend. GPU backends can still be used, but
          with expensive memory transfers. Enabled when MFEM_USE_CEED = YES. */
      CEED_CPU = 1UL << 11,
      /** @brief [device] CEED CUDA backend working together with the CUDA
          backend. Enabled when MFEM_USE_CEED = YES and MFEM_USE_CUDA = YES.
          NOTE: The current default libCEED CUDA backend is non-deterministic! */
      CEED_CUDA = 1UL << 12,
      /** @brief [device] CEED HIP backend working together with the HIP
          backend. Enabled when MFEM_USE_CEED = YES and MFEM_USE_HIP = YES. */
      CEED_HIP = 1UL << 13,
      /** @brief [device] Debug backend: host memory is READ/WRITE protected
          while a device is in use. This makes it possible to exercise the
          "device" code-path (separate host/device memory pools and
          host <-> device transfers) without any GPU hardware. Because 'DEBUG'
          is sometimes used as a macro, the `_DEVICE` suffix was added to
          avoid conflicts. */
      DEBUG_DEVICE = 1UL << 14
   };

   /** @brief Additional useful constants. The *_MASK constants can, for
       example, be used with Device::Allows(). */
   enum
   {
      /// Number of backends: from (1 << 0) to (1 << (NUM_BACKENDS-1)).
      NUM_BACKENDS = 15,

      /// Bitwise-OR of all CPU backends
      CPU_MASK = CPU | RAJA_CPU | OCCA_CPU | CEED_CPU,
      /// Bitwise-OR of all CUDA backends
      CUDA_MASK = CUDA | RAJA_CUDA | OCCA_CUDA | CEED_CUDA,
      /// Bitwise-OR of all HIP backends
      HIP_MASK = HIP | RAJA_HIP | CEED_HIP,
      /// Bitwise-OR of all OpenMP backends
      OMP_MASK = OMP | RAJA_OMP | OCCA_OMP,
      /// Bitwise-OR of all CEED backends
      CEED_MASK = CEED_CPU | CEED_CUDA | CEED_HIP,
      /// Bitwise-OR of all device backends
      DEVICE_MASK = CUDA_MASK | HIP_MASK | DEBUG_DEVICE,
      /// Bitwise-OR of all RAJA backends
      RAJA_MASK = RAJA_CPU | RAJA_OMP | RAJA_CUDA | RAJA_HIP,
      /// Bitwise-OR of all OCCA backends
      OCCA_MASK = OCCA_CPU | OCCA_OMP | OCCA_CUDA
   };
};


/** @brief The MFEM Device class abstracts hardware devices such as GPUs, as
    well as programming models such as CUDA, OCCA, RAJA and OpenMP. */
/** An object of this class acts as a "virtual device" with these properties:
    - No more than one object of this class may be constructed; that object is
      controlled through the static methods of the class.
    - When no Device object is constructed, the static methods operate on a
      default global object which is never configured and always uses
      Backend::CPU.
    - After it has been configured, the object cannot be re-configured for the
      rest of the program lifetime.
    - MFEM classes consult this object to decide where (host or device) an
      operation is performed and which backend implementation is used.
    - Several backends may be configured simultaneously; currently, a fixed
      priority order selects one specific backend out of the configured ones.
      See the Backend class and the Configure() method of this class for
      details. */
class Device
{
private:
   friend class MemoryManager;

   // Static state flags. They are only declared here; their definitions and
   // exact meaning live outside this header.
   static bool device_env;
   static bool mem_host_env;
   static bool mem_device_env;
   static bool mem_types_set;
   MFEM_ENZYME_INACTIVE static MFEM_EXPORT Device device_singleton;

   int dev = 0;   ///< Device ID of the configured device.
   int ngpu = -1; ///< Number of detected devices; -1: not initialized.

   /// Bitwise-OR of all configured backends.
   unsigned long backends = Backend::CPU;

   /// Set to true during configuration, except in 'device_singleton'.
   bool destroy_mm = false;
   /// GPU-aware MPI flag; see SetGPUAwareMPI() and GetGPUAwareMPI().
   bool mpi_gpu_aware = false;

   /// Current Host MemoryType
   MemoryType host_mem_type = MemoryType::HOST;
   /// Current Host MemoryClass
   MemoryClass host_mem_class = MemoryClass::HOST;

   /// Current Device MemoryType
   MemoryType device_mem_type = MemoryType::HOST;
   /// Current Device MemoryClass
   MemoryClass device_mem_class = MemoryClass::HOST;

   // Copying is disabled: copy constructor and copy assignment are deleted.
   Device(const Device &) = delete;
   Device &operator=(const Device &) = delete;

   // Access the Device singleton.
   static Device &Get()
   {
      return device_singleton;
   }

   /// Setup switcher based on configuration settings.
   void Setup(const std::string &device_option, const int device_id);

   /// Configure host/device MemoryType/MemoryClass.
   void UpdateMemoryTypeAndClass(const std::string &device_option);

   /// Add @a b to the set of configured backends.
   void MarkBackend(Backend::Id b)
   {
      backends |= b;
   }

public:
   /** @brief Default constructor. The default Backend::CPU is used unless
       Configure() is called later. */
   /** @note At most one Device object can be constructed during the lifetime of
       a program.
       @note This object should be destroyed after all other MFEM objects that
       use the Device are destroyed. */
   Device();

   /** @brief Construct a Device and configure it according to the @a device
       string. See Configure() for more details. */
   /** @note At most one Device object can be constructed during the lifetime of
       a program.
       @note This object should be destroyed after all other MFEM objects that
       use the Device are destroyed. */
   Device(const std::string &device, const int device_id = 0)
   {
      Configure(device, device_id);
   }

   /// Destructor.
   ~Device();

   /// Configure the Device backends.
   /** The @a device string must be a comma-separated list of backend string
       names (see below). The @a device_id argument specifies the ID of the
       actual devices (e.g. GPU) to use.
       - The available backends are described by the Backend class.
       - A backend's string name is the lowercase version of its Backend::Id
         enumeration constant with '_' replaced by '-', e.g. the string name
         of 'RAJA_CPU' is 'raja-cpu'. As an exception, the string name of the
         debug backend (Backend::Id 'DEBUG_DEVICE') is 'debug'.
       - The 'cpu' backend is always enabled with lowest priority.
       - The current backend priority from highest to lowest is:
         'ceed-cuda', 'occa-cuda', 'raja-cuda', 'cuda',
         'ceed-hip', 'hip', 'debug',
         'occa-omp', 'raja-omp', 'omp',
         'ceed-cpu', 'occa-cpu', 'raja-cpu', 'cpu'.
       - The following backend aliases are also available: 'ceed-gpu',
         'occa-gpu', 'raja-gpu', and 'gpu'; each aliases its respective
         '*-cuda' or '*-hip' backend depending on the MFEM build-time
         configuration.
       - Multiple backends can be configured at the same time.
       - Only one 'occa-*' backend can be configured at a time.
       - The backend 'occa-cuda' enables the 'cuda' backend unless 'raja-cuda'
         is already enabled.
       - The backend 'occa-omp' enables the 'omp' backend (if MFEM was built
         with MFEM_USE_OPENMP=YES) unless 'raja-omp' is already enabled.
       - Only one 'ceed-*' backend can be configured at a time.
       - The backend 'ceed-cpu' delegates to a libCEED CPU backend the setup and
         evaluation of the operator.
       - The backend 'ceed-cuda' delegates to a libCEED CUDA backend the setup
         and evaluation of operators and enables the 'cuda' backend to avoid
         transfers between host and device.
       - The backend 'ceed-hip' delegates to a libCEED HIP backend the setup
         and evaluation of operators and enables the 'hip' backend to avoid
         transfers between host and device.
       - The 'debug' backend should not be combined with other device backends.

       @note If the device is actually enabled, this method will also update the
       current host/device MemoryType and MemoryClass. */
   void Configure(const std::string &device, const int device_id = 0);

   /// Set the default host and device MemoryTypes, @a h_mt and @a d_mt.
   /** The host and device MemoryTypes are also set to be dual to each other.

       Most MFEM classes use these two MemoryType%s when allocating memory
       used on host and device, respectively.

       This method can only be called before Device construction and
       configuration, and the specified memory types must be compatible with
       the subsequent Device configuration. */
   static void SetMemoryTypes(MemoryType h_mt, MemoryType d_mt);

   /// Print the configuration of the MFEM virtual device object.
   void Print(std::ostream &os = mfem::out);

   /// Return true if Configure() has been called previously.
   static bool IsConfigured()
   {
      return Get().ngpu >= 0;
   }

   /// Return true if an actual device (e.g. GPU) has been configured.
   static bool IsAvailable()
   {
      return Get().ngpu > 0;
   }

   /// Return true if any backend other than Backend::CPU is enabled.
   static bool IsEnabled()
   {
      const unsigned long non_cpu = Get().backends & ~(Backend::CPU);
      return non_cpu != 0;
   }

   /// The opposite of IsEnabled().
   static bool IsDisabled()
   {
      return !IsEnabled();
   }

   /// Get the device ID of the configured device.
   static int GetId()
   {
      return Get().dev;
   }

   /// Get the number of available devices (may be called before configuration).
   static int GetDeviceCount();

   /** @brief Return true if any of the backends in the backend mask, @a b_mask,
       are allowed. */
   /** This method can be used with any of the Backend::Id constants, the
       Backend::*_MASK, or combinations of those. */
   static bool Allows(unsigned long b_mask)
   {
      const unsigned long matched = Get().backends & b_mask;
      return matched != 0;
   }

   /** @brief Get the current Host MemoryType. This is the MemoryType used by
       most MFEM classes when allocating memory used on the host. */
   static MemoryType GetHostMemoryType()
   {
      return Get().host_mem_type;
   }

   /** @brief Get the current Host MemoryClass. This is the MemoryClass used
       by most MFEM host Memory objects. */
   static MemoryClass GetHostMemoryClass()
   {
      return Get().host_mem_class;
   }

   /** @brief Get the current Device MemoryType. This is the MemoryType used by
       most MFEM classes when allocating memory to be used with device
       kernels. */
   static MemoryType GetDeviceMemoryType()
   {
      return Get().device_mem_type;
   }

   /// (DEPRECATED) Equivalent to GetDeviceMemoryType().
   /** @deprecated Use GetDeviceMemoryType() instead. */
   static MemoryType GetMemoryType()
   {
      return GetDeviceMemoryType();
   }

   /** @brief Get the current Device MemoryClass. This is the MemoryClass used
       by most MFEM device kernels to access Memory objects. */
   static MemoryClass GetDeviceMemoryClass()
   {
      return Get().device_mem_class;
   }

   /// (DEPRECATED) Equivalent to GetDeviceMemoryClass().
   /** @deprecated Use GetDeviceMemoryClass() instead. */
   static MemoryClass GetMemoryClass()
   {
      return GetDeviceMemoryClass();
   }

   /** @brief Manually set the status of GPU-aware MPI flag for use in MPI
       communication routines which have optimized implementations for device
       buffers. */
   static void SetGPUAwareMPI(const bool force = true)
   {
      Get().mpi_gpu_aware = force;
   }

   /// Get the status of GPU-aware MPI flag.
   static bool GetGPUAwareMPI()
   {
      return Get().mpi_gpu_aware;
   }

   /** @brief Query the device driver for what memory type a given @a ptr is
       allocated with. */
   static MemoryType QueryMemoryType(const void *ptr);

   /** @brief The number of hardware compute units/streaming multiprocessors
       available on a given compute device @a device_id. */
   static int NumMultiprocessors(int device_id);

   /// Same as NumMultiprocessors(int), for the currently active device.
   static int NumMultiprocessors();

   /** @brief The number of threads in a warp on a given compute device
       @a device_id. */
   static int WarpSize(int device_id);

   /// Same as WarpSize(int), for the currently active device.
   static int WarpSize();

   /** @brief Gets the @a free and @a total memory on the device. */
   static void DeviceMem(size_t *free, size_t *total);
};


// Inline Memory access functions using the mfem::Device DeviceMemoryClass or

// the mfem::Device HostMemoryClass.


/** @brief Return the memory class that Read(), Write(), and ReadWrite()
    should use. When @a on_dev is true, the device use flag of @a mem is set
    and the mfem::Device's DeviceMemoryClass is returned; otherwise the
    mfem::Device's HostMemoryClass is returned and @a mem is left untouched. */
template <typename T>
inline MemoryClass GetMemoryClass(const Memory<T> &mem, bool on_dev)
{
   if (on_dev)
   {
      // Device access requested: flag the memory as used on the device.
      mem.UseDevice(true);
      return Device::GetDeviceMemoryClass();
   }
   return Device::GetHostMemoryClass();
}


/** @brief Get a pointer for read access to @a mem with the mfem::Device's

    DeviceMemoryClass, if @a on_dev = true, or the mfem::Device's

    HostMemoryClass, otherwise. */

/** Also, if @a on_dev = true, the device flag of @a mem will be set. */

template <typename T>


inline const T *Read(const Memory<T> &mem, int size, bool on_dev = true)

{

   return mem.Read(GetMemoryClass(mem, on_dev), size);

}


/** @brief Host-only variant of Read(): equivalent to
    Read(const Memory<T> &mem, int size, false). */
template <typename T>
inline const T *HostRead(const Memory<T> &mem, int size)
{
   const bool on_dev = false;
   return mfem::Read(mem, size, on_dev);
}


/** @brief Get a pointer for write access to @a mem, using the mfem::Device's
    DeviceMemoryClass when @a on_dev = true and the mfem::Device's
    HostMemoryClass otherwise. */
/** When @a on_dev = true, the device flag of @a mem is set as well. */
template <typename T>
inline T *Write(Memory<T> &mem, int size, bool on_dev = true)
{
   const MemoryClass mc = GetMemoryClass(mem, on_dev);
   return mem.Write(mc, size);
}


/** @brief Host-only variant of Write(): equivalent to
    Write(Memory<T> &mem, int size, false). */
template <typename T>
inline T *HostWrite(Memory<T> &mem, int size)
{
   const bool on_dev = false;
   return mfem::Write(mem, size, on_dev);
}


/** @brief Get a pointer for read+write access to @a mem, using the
    mfem::Device's DeviceMemoryClass when @a on_dev = true and the
    mfem::Device's HostMemoryClass otherwise. */
/** When @a on_dev = true, the device flag of @a mem is set as well. */
template <typename T>
inline T *ReadWrite(Memory<T> &mem, int size, bool on_dev = true)
{
   const MemoryClass mc = GetMemoryClass(mem, on_dev);
   return mem.ReadWrite(mc, size);
}


/** @brief Host-only variant of ReadWrite(): equivalent to
    ReadWrite(Memory<T> &mem, int size, false). */
template <typename T>
inline T *HostReadWrite(Memory<T> &mem, int size)
{
   const bool on_dev = false;
   return mfem::ReadWrite(mem, size, on_dev);
}


} // namespace mfem


#endif // MFEM_DEVICE_HPP

mfem::Device
The MFEM Device class abstracts hardware devices such as GPUs, as well as programming models such as ...
Definition device.hpp:124

mfem::Device::GetHostMemoryType
static MemoryType GetHostMemoryType()
Get the current Host MemoryType. This is the MemoryType used by most MFEM classes when allocating mem...
Definition device.hpp:268

mfem::Device::~Device
~Device()
Destructor.
Definition device.cpp:156

mfem::Device::GetMemoryClass
static MemoryClass GetMemoryClass()
(DEPRECATED) Equivalent to GetDeviceMemoryClass().
Definition device.hpp:289

mfem::Device::DeviceMem
static void DeviceMem(size_t *free, size_t *total)
Gets the free and total memory on the device.
Definition device.cpp:700

mfem::Device::GetHostMemoryClass
static MemoryClass GetHostMemoryClass()
Get the current Host MemoryClass. This is the MemoryClass used by most MFEM host Memory objects.
Definition device.hpp:272

mfem::Device::Configure
void Configure(const std::string &device, const int device_id=0)
Configure the Device backends.
Definition device.cpp:189

mfem::Device::IsAvailable
static bool IsAvailable()
Return true if an actual device (e.g. GPU) has been configured.
Definition device.hpp:244

mfem::Device::SetGPUAwareMPI
static void SetGPUAwareMPI(const bool force=true)
Manually set the status of GPU-aware MPI flag for use in MPI communication routines which have optimi...
Definition device.hpp:294

mfem::Device::GetMemoryType
static MemoryType GetMemoryType()
(DEPRECATED) Equivalent to GetDeviceMemoryType().
Definition device.hpp:281

mfem::Device::NumMultiprocessors
static int NumMultiprocessors()
Same as NumMultiprocessors(int), for the currently active device.
Definition device.cpp:736

mfem::Device::IsConfigured
static bool IsConfigured()
Return true if Configure() has been called previously.
Definition device.hpp:241

mfem::Device::QueryMemoryType
static MemoryType QueryMemoryType(const void *ptr)
Definition device.cpp:618

mfem::Device::Print
void Print(std::ostream &os=mfem::out)
Print the configuration of the MFEM virtual device object.
Definition device.cpp:317

mfem::Device::Allows
static bool Allows(unsigned long b_mask)
Return true if any of the backends in the backend mask, b_mask, are allowed.
Definition device.hpp:262

mfem::Device::Device
Device(const std::string &device, const int device_id=0)
Construct a Device and configure it based on the device string. See Configure() for more details.
Definition device.hpp:180

mfem::Device::SetMemoryTypes
static void SetMemoryTypes(MemoryType h_mt, MemoryType d_mt)
Set the default host and device MemoryTypes, h_mt and d_mt.
Definition device.cpp:294

mfem::Device::GetGPUAwareMPI
static bool GetGPUAwareMPI()
Get the status of GPU-aware MPI flag.
Definition device.hpp:298

mfem::Device::GetDeviceMemoryClass
static MemoryClass GetDeviceMemoryClass()
Get the current Device MemoryClass. This is the MemoryClass used by most MFEM device kernels to acces...
Definition device.hpp:285

mfem::Device::GetId
static int GetId()
Get the device ID of the configured device.
Definition device.hpp:253

mfem::Device::WarpSize
static int WarpSize()
Same as WarpSize(int), for the currently active device.
Definition device.cpp:764

mfem::Device::GetDeviceCount
static int GetDeviceCount()
Get the number of available devices (may be called before configuration).
Definition device.cpp:425

mfem::Device::IsEnabled
static bool IsEnabled()
Return true if any backend other than Backend::CPU is enabled.
Definition device.hpp:247

mfem::Device::Device
Device()
Default constructor. Unless Configure() is called later, the default Backend::CPU will be used.
Definition device.cpp:74

mfem::Device::GetDeviceMemoryType
static MemoryType GetDeviceMemoryType()
Get the current Device MemoryType. This is the MemoryType used by most MFEM classes when allocating m...
Definition device.hpp:277

mfem::Device::IsDisabled
static bool IsDisabled()
The opposite of IsEnabled().
Definition device.hpp:250

mfem::MemoryManager
Definition mem_manager.hpp:625

mfem::Memory
Class used by MFEM to store pointers to host and/or device memory.
Definition mem_manager.hpp:168

mfem::Memory::Write
T * Write(MemoryClass mc, int size)
Get write-only access to the memory with the given MemoryClass.
Definition mem_manager.hpp:1218

mfem::Memory::ReadWrite
T * ReadWrite(MemoryClass mc, int size)
Get read-write access to the memory with the given MemoryClass.
Definition mem_manager.hpp:1192

mfem::Memory::UseDevice
bool UseDevice() const
Read the internal device flag.
Definition mem_manager.hpp:315

mfem::Memory::Read
const T * Read(MemoryClass mc, int size) const
Get read-only access to the memory with the given MemoryClass.
Definition mem_manager.hpp:1205

enzyme.hpp

globals.hpp

b
real_t b
Definition lissajous.cpp:42

mem_manager.hpp

mfem
Definition CodeDocumentation.dox:1

mfem::Read
const T * Read(const Memory< T > &mem, int size, bool on_dev=true)
Get a pointer for read access to mem with the mfem::Device's DeviceMemoryClass, if on_dev = true,...
Definition device.hpp:348

mfem::GetMemoryClass
MemoryClass GetMemoryClass(const Memory< T > &mem, bool on_dev)
Return the memory class to be used by the functions Read(), Write(), and ReadWrite(),...
Definition device.hpp:330

mfem::HostReadWrite
T * HostReadWrite(Memory< T > &mem, int size)
Shortcut to ReadWrite(Memory<T> &mem, int size, false)
Definition device.hpp:389

mfem::HostRead
const T * HostRead(const Memory< T > &mem, int size)
Shortcut to Read(const Memory<T> &mem, int size, false)
Definition device.hpp:355

mfem::Write
T * Write(Memory< T > &mem, int size, bool on_dev=true)
Get a pointer for write access to mem with the mfem::Device's DeviceMemoryClass, if on_dev = true,...
Definition device.hpp:365

mfem::out
OutStream out(std::cout)
Global stream used by the library for standard output. Initially it uses the same std::streambuf as s...
Definition globals.hpp:66

mfem::MemoryClass
MemoryClass
Memory classes identify sets of memory types.
Definition mem_manager.hpp:81

mfem::MemoryClass::HOST
@ HOST

mfem::ReadWrite
T * ReadWrite(Memory< T > &mem, int size, bool on_dev=true)
Get a pointer for read+write access to mem with the mfem::Device's DeviceMemoryClass,...
Definition device.hpp:382

mfem::HostWrite
T * HostWrite(Memory< T > &mem, int size)
Shortcut to Write(const Memory<T> &mem, int size, false)
Definition device.hpp:372

mfem::MemoryType
MemoryType
Memory types supported by MFEM.
Definition mem_manager.hpp:39

mfem::MemoryType::HOST
@ HOST
Host memory; using new[] and delete[].

mfem::Backend
MFEM backends.
Definition device.hpp:30

mfem::Backend::Id
Id
In the documentation below, we use square brackets to indicate the type of the backend: host or devic...
Definition device.hpp:34

mfem::Backend::RAJA_OMP
@ RAJA_OMP
[host] RAJA OpenMP backend. Enabled when MFEM_USE_RAJA = YES and MFEM_USE_OPENMP = YES.
Definition device.hpp:48

mfem::Backend::RAJA_CUDA
@ RAJA_CUDA
[device] RAJA CUDA backend. Enabled when MFEM_USE_RAJA = YES and MFEM_USE_CUDA = YES.
Definition device.hpp:51

mfem::Backend::DEBUG_DEVICE
@ DEBUG_DEVICE
[device] Debug backend: host memory is READ/WRITE protected while a device is in use....
Definition device.hpp:78

mfem::Backend::RAJA_CPU
@ RAJA_CPU
[host] RAJA CPU backend: sequential execution on each MPI rank. Enabled when MFEM_USE_RAJA = YES.
Definition device.hpp:45

mfem::Backend::OMP
@ OMP
[host] OpenMP backend. Enabled when MFEM_USE_OPENMP = YES.
Definition device.hpp:38

mfem::Backend::HIP
@ HIP
[device] HIP backend. Enabled when MFEM_USE_HIP = YES.
Definition device.hpp:42

mfem::Backend::OCCA_OMP
@ OCCA_OMP
[host] OCCA OpenMP backend. Enabled when MFEM_USE_OCCA = YES.
Definition device.hpp:59

mfem::Backend::RAJA_HIP
@ RAJA_HIP
[device] RAJA HIP backend. Enabled when MFEM_USE_RAJA = YES and MFEM_USE_HIP = YES.
Definition device.hpp:54

mfem::Backend::OCCA_CUDA
@ OCCA_CUDA
[device] OCCA CUDA backend. Enabled when MFEM_USE_OCCA = YES and MFEM_USE_CUDA = YES.
Definition device.hpp:62

mfem::Backend::CEED_CPU
@ CEED_CPU
[host] CEED CPU backend. GPU backends can still be used, but with expensive memory transfers....
Definition device.hpp:65

mfem::Backend::OCCA_CPU
@ OCCA_CPU
[host] OCCA CPU backend: sequential execution on each MPI rank. Enabled when MFEM_USE_OCCA = YES.
Definition device.hpp:57

mfem::Backend::CEED_CUDA
@ CEED_CUDA
[device] CEED CUDA backend working together with the CUDA backend. Enabled when MFEM_USE_CEED = YES a...
Definition device.hpp:69

mfem::Backend::CPU
@ CPU
[host] Default CPU backend: sequential execution on each MPI rank.
Definition device.hpp:36

mfem::Backend::CUDA
@ CUDA
[device] CUDA backend. Enabled when MFEM_USE_CUDA = YES.
Definition device.hpp:40

mfem::Backend::CEED_HIP
@ CEED_HIP
[device] CEED HIP backend working together with the HIP backend. Enabled when MFEM_USE_CEED = YES and...
Definition device.hpp:72

mfem::Backend::RAJA_MASK
@ RAJA_MASK
Bitwise-OR of all RAJA backends.
Definition device.hpp:101

mfem::Backend::DEVICE_MASK
@ DEVICE_MASK
Bitwise-OR of all device backends.
Definition device.hpp:99

mfem::Backend::CEED_MASK
@ CEED_MASK
Bitwise-OR of all CEED backends.
Definition device.hpp:97

mfem::Backend::OCCA_MASK
@ OCCA_MASK
Bitwise-OR of all OCCA backends.
Definition device.hpp:103

mfem::Backend::HIP_MASK
@ HIP_MASK
Bitwise-OR of all HIP backends.
Definition device.hpp:93

mfem::Backend::CPU_MASK
@ CPU_MASK
Bitwise-OR of all CPU backends.
Definition device.hpp:89

mfem::Backend::NUM_BACKENDS
@ NUM_BACKENDS
Number of backends: from (1 << 0) to (1 << (NUM_BACKENDS-1)).
Definition device.hpp:86

mfem::Backend::CUDA_MASK
@ CUDA_MASK
Bitwise-OR of all CUDA backends.
Definition device.hpp:91

mfem::Backend::OMP_MASK
@ OMP_MASK
Bitwise-OR of all OpenMP backends.
Definition device.hpp:95