4.0/device_8hpp_source.html

 // Copyright (c) 2010, Lawrence Livermore National Security, LLC. Produced at

 // the Lawrence Livermore National Laboratory. LLNL-CODE-443211. All Rights

 // reserved. See file COPYRIGHT for details.

 //

 // This file is part of the MFEM library. For more information and source code

 // availability see http://mfem.org.

 //

 // MFEM is free software; you can redistribute it and/or modify it under the

 // terms of the GNU Lesser General Public License (as published by the Free

 // Software Foundation) version 2.1 dated February 1999.


 #ifndef MFEM_DEVICE_HPP

 #define MFEM_DEVICE_HPP


 #include "globals.hpp"

 #include "mem_manager.hpp"


 namespace mfem

 {


 /// MFEM backends.

 /** Individual backends will generally implement only a subset of the kernels

     implemented by the default CPU backend. The goal of the backends is to

     accelerate data-parallel portions of the code and they can use a device

     memory space (e.g. GPUs) or share the memory space of the host (OpenMP). */

 struct Backend

 {

    /** @brief In the documentation below, we use square brackets to indicate the

        type of the backend: host or device. Each Id occupies a distinct bit, so

        several backends can be combined with bitwise-OR. */

    enum Id

    {

       /// [host] Default CPU backend: sequential execution on each MPI rank.

       CPU = 1 << 0,

       /// [host] OpenMP backend. Enabled when MFEM_USE_OPENMP = YES.

       OMP = 1 << 1,

       /// [device] CUDA backend. Enabled when MFEM_USE_CUDA = YES.

       CUDA = 1 << 2,

       /** @brief [host] RAJA CPU backend: sequential execution on each MPI rank.

           Enabled when MFEM_USE_RAJA = YES. */

       RAJA_CPU = 1 << 3,

       /** @brief [host] RAJA OpenMP backend. Enabled when MFEM_USE_RAJA = YES

           and MFEM_USE_OPENMP = YES. */

       RAJA_OMP = 1 << 4,

       /** @brief [device] RAJA CUDA backend. Enabled when MFEM_USE_RAJA = YES

           and MFEM_USE_CUDA = YES. */

       RAJA_CUDA = 1 << 5,

       /** @brief [host] OCCA CPU backend: sequential execution on each MPI rank.

           Enabled when MFEM_USE_OCCA = YES. */

       OCCA_CPU = 1 << 6,

       /// [host] OCCA OpenMP backend. Enabled when MFEM_USE_OCCA = YES.

       OCCA_OMP = 1 << 7,

       /** @brief [device] OCCA CUDA backend. Enabled when MFEM_USE_OCCA = YES

           and MFEM_USE_CUDA = YES. */

       OCCA_CUDA = 1 << 8

    };


    /** @brief Additional useful constants. For example, the *_MASK constants can

        be used with Device::Allows(). */

    enum

    {

       /// Number of backends: from (1 << 0) to (1 << (NUM_BACKENDS-1)).

       NUM_BACKENDS = 9,


       /// Bitwise-OR of all CPU backends

       CPU_MASK = CPU | RAJA_CPU | OCCA_CPU,

       /// Bitwise-OR of all CUDA backends

       CUDA_MASK = CUDA | RAJA_CUDA | OCCA_CUDA,

       /// Bitwise-OR of all OpenMP backends

       OMP_MASK = OMP | RAJA_OMP | OCCA_OMP,

       /// Bitwise-OR of all device backends (currently identical to CUDA_MASK)

       DEVICE_MASK = CUDA_MASK,


       /// Bitwise-OR of all RAJA backends

       RAJA_MASK = RAJA_CPU | RAJA_OMP | RAJA_CUDA,

       /// Bitwise-OR of all OCCA backends

       OCCA_MASK = OCCA_CPU | OCCA_OMP | OCCA_CUDA

    };

 };


 /** @brief The MFEM Device class abstracts hardware devices such as GPUs, as

     well as programming models such as CUDA, OCCA, RAJA and OpenMP. */

 /** This class represents a "virtual device" with the following properties:

     - At most one object of this class can be constructed and that object is

       controlled by its static methods.

     - If no Device object is constructed, the static methods will use a default

       global object which is never configured and always uses Backend::CPU.

     - Once configured, the object cannot be re-configured during the program

       lifetime.

     - MFEM classes use this object to determine where (host or device) to

       perform an operation and which backend implementation to use.

     - Multiple backends can be configured at the same time; currently, a fixed

       priority order is used to select a specific backend from the list of

       configured backends. See the Backend class and the Configure() method in

       this class for details. */

 class Device
 {
 private:
    /// Execution modes; IsEnabled() reports true only in ACCELERATED mode.
    enum MODES {SEQUENTIAL, ACCELERATED};

    /// Global object returned by Get() and consulted by all static methods.
    static Device device_singleton;

    // Every data member has an in-class initializer so that all constructors
    // start from the same unconfigured state using only Backend::CPU and host
    // memory, without repeating the initializer list in each constructor.
    MODES mode = SEQUENTIAL;
    int dev = 0; ///< Device ID of the configured device.
    int ngpu = -1; ///< Number of detected devices; -1: not initialized.
    /// Bitwise-OR of all configured backends.
    unsigned long backends = Backend::CPU;
    /// Set to true during configuration, except in 'device_singleton'.
    bool destroy_mm = false;

    MemoryType mem_type = MemoryType::HOST;    ///< Current Device MemoryType
    MemoryClass mem_class = MemoryClass::HOST; ///< Current Device MemoryClass

    /// Copying is not allowed. The operations are explicitly deleted so that
    /// any attempt to copy, including from members, fails at compile time.
    Device(Device const&) = delete;
    void operator=(Device const&) = delete;

    /// Access the global Device object used by the static methods.
    static Device& Get() { return device_singleton; }

    /// Setup switcher based on configuration settings
    void Setup(const int dev = 0);

    /// Add the backend @a b to the set of configured backends.
    void MarkBackend(Backend::Id b) { backends |= b; }

    void UpdateMemoryTypeAndClass();

    /// Enable the use of the configured device in the code that follows.
    /** After this call MFEM classes will use the backend kernels whenever
        possible, transferring data automatically to the device, if necessary.

        If the only configured backend is the default host CPU one, the device
        will remain disabled.

        If the device is actually enabled, this method will also update the
        current MemoryType and MemoryClass. */
    static void Enable();

 public:
    /** @brief Default constructor. Unless Configure() is called later, the
        default Backend::CPU will be used. */
    /** @note At most one Device object can be constructed during the lifetime of
        a program.
        @note This object should be destroyed after all other MFEM objects that
        use the Device are destroyed. */
    Device() { }

    /** @brief Construct a Device and configure it based on the @a device string.
        See Configure() for more details. */
    /** @note At most one Device object can be constructed during the lifetime of
        a program.
        @note This object should be destroyed after all other MFEM objects that
        use the Device are destroyed. */
    Device(const std::string &device, const int dev = 0)
    { Configure(device, dev); }

    /// Destructor.
    ~Device();

    /// Configure the Device backends.
    /** The string parameter @a device must be a comma-separated list of backend
        string names (see below). The @a dev argument specifies the ID of the
        actual devices (e.g. GPU) to use.
        * The available backends are described by the Backend class.
        * The string name of a backend is the lowercase version of the
          Backend::Id enumeration constant with '_' replaced by '-', e.g. the
          string name of 'RAJA_CPU' is 'raja-cpu'.
        * The 'cpu' backend is always enabled with lowest priority.
        * The current backend priority from highest to lowest is: 'occa-cuda',
          'raja-cuda', 'cuda', 'occa-omp', 'raja-omp', 'omp', 'occa-cpu',
          'raja-cpu', 'cpu'.
        * Multiple backends can be configured at the same time.
        * Only one 'occa-*' backend can be configured at a time.
        * The backend 'occa-cuda' enables the 'cuda' backend unless 'raja-cuda'
          is already enabled. */
    void Configure(const std::string &device, const int dev = 0);

    /// Print the configuration of the MFEM virtual device object.
    void Print(std::ostream &out = mfem::out);

    /// Return true if Configure() has been called previously.
    /** Implemented as a check that the device count is no longer the initial
        value of -1. */
    static inline bool IsConfigured() { return Get().ngpu >= 0; }

    /// Return true if an actual device (e.g. GPU) has been configured.
    static inline bool IsAvailable() { return Get().ngpu > 0; }

    /// Return true if any backend other than Backend::CPU is enabled.
    static inline bool IsEnabled() { return Get().mode == ACCELERATED; }

    /// The opposite of IsEnabled().
    static inline bool IsDisabled() { return !IsEnabled(); }

    /** @brief Return true if any of the backends in the backend mask, @a b_mask,
        are allowed. */
    /** This method can be used with any of the Backend::Id constants, the
        Backend::*_MASK, or combinations of those. */
    static inline bool Allows(unsigned long b_mask)
    { return (Get().backends & b_mask) != 0; }

    /** @brief Get the current Device MemoryType. This is the MemoryType used by
        most MFEM classes when allocating memory to be used with device kernels.
    */
    static inline MemoryType GetMemoryType() { return Get().mem_type; }

    /** @brief Get the current Device MemoryClass. This is the MemoryClass used
        by most MFEM device kernels to access Memory objects. */
    static inline MemoryClass GetMemoryClass() { return Get().mem_class; }
 };


 // Inline Memory access functions using the mfem::Device MemoryClass or

 // MemoryClass::HOST.


 /** @brief Get a pointer for read access to @a mem with the mfem::Device

     MemoryClass, if @a on_dev = true, or MemoryClass::HOST, otherwise. */

 /** Also, if @a on_dev = true, the device flag of @a mem will be set. */

 template <typename T>

 inline const T *Read(const Memory<T> &mem, int size, bool on_dev = true)

 {

    if (!on_dev)

    {

       return mem.Read(MemoryClass::HOST, size);

    }

    else

    {

       mem.UseDevice(true);

       return mem.Read(Device::GetMemoryClass(), size);

    }

 }


 /** @brief Host-only read access: equivalent to calling
     Read(const Memory<T> &mem, int size, false). */
 template <typename T>
 inline const T *HostRead(const Memory<T> &mem, int size)
 {
    const bool on_dev = false; // always request MemoryClass::HOST access
    return mfem::Read(mem, size, on_dev);
 }


 /** @brief Obtain a write pointer to the first @a size entries of @a mem, using
     the mfem::Device MemoryClass when @a on_dev is true and MemoryClass::HOST
     when it is false. */
 /** When @a on_dev is true, the device flag of @a mem is set (via
     UseDevice(true)) before the access is requested. */
 template <typename T>
 inline T *Write(Memory<T> &mem, int size, bool on_dev = true)
 {
    MemoryClass access_class = MemoryClass::HOST;
    if (on_dev)
    {
       // Flag the memory for device use first, then query the device class.
       mem.UseDevice(true);
       access_class = Device::GetMemoryClass();
    }
    return mem.Write(access_class, size);
 }


 /** @brief Shortcut to Write(const Memory<T> &mem, int size, false) */

 template <typename T>

 inline const T *HostWrite(const Memory<T> &mem, int size)

 {

    return mfem::Write(mem, size, false);

 }


 /** @brief Obtain a read+write pointer to the first @a size entries of @a mem,
     using the mfem::Device MemoryClass when @a on_dev is true and
     MemoryClass::HOST when it is false. */
 /** When @a on_dev is true, the device flag of @a mem is set (via
     UseDevice(true)) before the access is requested. */
 template <typename T>
 inline T *ReadWrite(Memory<T> &mem, int size, bool on_dev = true)
 {
    MemoryClass access_class = MemoryClass::HOST;
    if (on_dev)
    {
       // Flag the memory for device use first, then query the device class.
       mem.UseDevice(true);
       access_class = Device::GetMemoryClass();
    }
    return mem.ReadWrite(access_class, size);
 }


 /** @brief Shortcut to ReadWrite(const Memory<T> &mem, int size, false) */

 template <typename T>

 inline const T *HostReadWrite(const Memory<T> &mem, int size)

 {

    return mfem::ReadWrite(mem, size, false);

 }


 } // mfem


 #endif // MFEM_DEVICE_HPP

mfem::Device::GetMemoryClass
static MemoryClass GetMemoryClass()
Get the current Device MemoryClass. This is the MemoryClass used by most MFEM device kernels to acces...
Definition: device.hpp:214

mfem::Device::IsAvailable
static bool IsAvailable()
Return true if an actual device (e.g. GPU) has been configured.
Definition: device.hpp:192

mfem::Backend::OMP
[host] OpenMP backend. Enabled when MFEM_USE_OPENMP = YES.
Definition: device.hpp:35

mfem::Device::IsConfigured
static bool IsConfigured()
Return true if Configure() has been called previously.
Definition: device.hpp:189

mfem::Device::~Device
~Device()
Destructor.
Definition: device.cpp:54

mem_manager.hpp

mfem::Write
T * Write(Memory< T > &mem, int size, bool on_dev=true)
Get a pointer for write access to mem with the mfem::Device MemoryClass, if on_dev = true...
Definition: device.hpp:249

mfem::Device::Device
Device(const std::string &device, const int dev=0)
Construct a Device and configure it based on the device string. See Configure() for more details...
Definition: device.hpp:156

mfem::Memory::Write
T * Write(MemoryClass mc, int size)
Get write-only access to the memory with the given MemoryClass.
Definition: mem_manager.hpp:628

mfem::Device::Print
void Print(std::ostream &out=mfem::out)
Print the configuration of the MFEM virtual device object.
Definition: device.cpp:98

mfem::Device::IsEnabled
static bool IsEnabled()
Return true if any backend other than Backend::CPU is enabled.
Definition: device.hpp:195

mfem::Device::IsDisabled
static bool IsDisabled()
The opposite of IsEnabled().
Definition: device.hpp:198

mfem::Device::Configure
void Configure(const std::string &device, const int dev=0)
Configure the Device backends.
Definition: device.cpp:59

mfem::Device::Device
Device()
Default constructor. Unless Configure() is called later, the default Backend::CPU will be used...
Definition: device.hpp:142

mfem::Backend::OCCA_CUDA
[device] OCCA CUDA backend. Enabled when MFEM_USE_OCCA = YES and MFEM_USE_CUDA = YES.
Definition: device.hpp:54

mfem::Backend::RAJA_CPU
[host] RAJA CPU backend: sequential execution on each MPI rank. Enabled when MFEM_USE_RAJA = YES...
Definition: device.hpp:40

mfem::Backend::RAJA_OMP
[host] RAJA OpenMP backend. Enabled when MFEM_USE_RAJA = YES and MFEM_USE_OPENMP = YES...
Definition: device.hpp:43

mfem::Backend::NUM_BACKENDS
Number of backends: from (1 << 0) to (1 << (NUM_BACKENDS-1)).
Definition: device.hpp:62

mfem::Backend
MFEM backends.
Definition: device.hpp:26

mfem::Device::GetMemoryType
static MemoryType GetMemoryType()
Get the current Device MemoryType. This is the MemoryType used by most MFEM classes when allocating m...
Definition: device.hpp:210

mfem::Backend::OMP_MASK
Bitwise-OR of all OpenMP backends.
Definition: device.hpp:69

mfem::Backend::OCCA_OMP
[host] OCCA OpenMP backend. Enabled when MFEM_USE_OCCA = YES.
Definition: device.hpp:51

mfem::Backend::CPU
[host] Default CPU backend: sequential execution on each MPI rank.
Definition: device.hpp:33

mfem::Read
const T * Read(const Memory< T > &mem, int size, bool on_dev=true)
Get a pointer for read access to mem with the mfem::Device MemoryClass, if on_dev = true...
Definition: device.hpp:225

mfem::Backend::CUDA_MASK
Bitwise-OR of all CUDA backends.
Definition: device.hpp:67

mfem::Backend::CPU_MASK
Bitwise-OR of all CPU backends.
Definition: device.hpp:65

mfem::MemoryType
MemoryType
Memory types supported by MFEM.
Definition: mem_manager.hpp:27

mfem::Device::Allows
static bool Allows(unsigned long b_mask)
Return true if any of the backends in the backend mask, b_mask, are allowed.
Definition: device.hpp:204

mfem::HostRead
const T * HostRead(const Memory< T > &mem, int size)
Shortcut to Read(const Memory<T> &mem, int size, false)
Definition: device.hpp:240

mfem::ReadWrite
T * ReadWrite(Memory< T > &mem, int size, bool on_dev=true)
Get a pointer for read+write access to mem with the mfem::Device MemoryClass, if on_dev = true...
Definition: device.hpp:273

mfem::HostReadWrite
const T * HostReadWrite(const Memory< T > &mem, int size)
Shortcut to ReadWrite(const Memory<T> &mem, int size, false)
Definition: device.hpp:288

mfem::MemoryType::HOST
Host memory; using new[] and delete[].

mfem::Memory::ReadWrite
T * ReadWrite(MemoryClass mc, int size)
Get read-write access to the memory with the given MemoryClass.
Definition: mem_manager.hpp:601

mfem::Backend::OCCA_MASK
Bitwise-OR of all OCCA backends.
Definition: device.hpp:76

mfem::Backend::Id
Id
In the documentation below, we use square brackets to indicate the type of the backend: host or devic...
Definition: device.hpp:30

mfem::Memory
Class used by MFEM to store pointers to host and/or device memory.
Definition: mem_manager.hpp:102

mfem::Backend::RAJA_MASK
Bitwise-OR of all RAJA backends.
Definition: device.hpp:74

mfem::HostWrite
const T * HostWrite(const Memory< T > &mem, int size)
Shortcut to Write(const Memory<T> &mem, int size, false)
Definition: device.hpp:264

mfem::Memory::UseDevice
bool UseDevice() const
Read the internal device flag.
Definition: mem_manager.hpp:207

globals.hpp

mfem::Backend::DEVICE_MASK
Bitwise-OR of all device backends.
Definition: device.hpp:71

mfem::out
OutStream out(std::cout)
Global stream used by the library for standard output. Initially it uses the same std::streambuf as s...
Definition: globals.hpp:64

mfem::Device
The MFEM Device class abstracts hardware devices such as GPUs, as well as programming models such as ...
Definition: device.hpp:96

mfem::Backend::RAJA_CUDA
[device] RAJA CUDA backend. Enabled when MFEM_USE_RAJA = YES and MFEM_USE_CUDA = YES.
Definition: device.hpp:46

mfem::Memory::Read
const T * Read(MemoryClass mc, int size) const
Get read-only access to the memory with the given MemoryClass.
Definition: mem_manager.hpp:614

mfem::MemoryClass
MemoryClass
Memory classes identify subsets of memory types.
Definition: mem_manager.hpp:40

mfem::Backend::OCCA_CPU
[host] OCCA CPU backend: sequential execution on each MPI rank. Enabled when MFEM_USE_OCCA = YES...
Definition: device.hpp:49

mfem::Backend::CUDA
[device] CUDA backend. Enabled when MFEM_USE_CUDA = YES.
Definition: device.hpp:37