4.9/reducers_8hpp_source.html

// Copyright (c) 2010-2025, Lawrence Livermore National Security, LLC. Produced

// at the Lawrence Livermore National Laboratory. All Rights reserved. See files

// LICENSE and NOTICE for details. LLNL-CODE-806117.

//

// This file is part of the MFEM library. For more information and source code

// availability visit https://mfem.org.

//

// MFEM is free software; you can redistribute it and/or modify it under the

// terms of the BSD-3 license. We welcome feedback and contributions, see file

// CONTRIBUTING.md for details.


#ifndef MFEM_REDUCERS_HPP

#define MFEM_REDUCERS_HPP


#include "array.hpp"

#include "forall.hpp"


#include <cmath>

#include <limits>

#include <type_traits>


namespace mfem

{


/// @brief Minimal two-member aggregate which can be used in device code.
///
/// Being a plain aggregate it is initialized positionally, e.g.
/// `DevicePair<A, B>{first_value, second_value}`.
template <typename A, typename B>
struct DevicePair
{
   A first;   ///< first stored value
   B second;  ///< second stored value
};


/// @brief Aggregate holding a minimum and a maximum value together with the
/// location index of each.
///
/// The member order is (min_val, max_val, min_loc, max_loc); positional
/// aggregate initialization depends on it.
template <typename A, typename B>
struct MinMaxLocScalar
{
   A min_val;  ///< minimum value
   A max_val;  ///< maximum value
   B min_loc;  ///< location index that goes with min_val
   B max_loc;  ///< location index that goes with max_val
};


/// @brief a += b
///
/// Reducer that combines partial results by addition; partial results are
/// seeded with T(0).
template <typename T>
struct SumReducer
{
   /// Type of the partial results being combined.
   using value_type = T;

   /// Seed @a a with the additive identity T(0).
   static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
   {
      a = T(0);
   }

   /// Fold the partial result @a b into @a a.
   static MFEM_HOST_DEVICE void Join(value_type &a, const value_type &b) { a += b; }
};


/// @brief a *= b
///
/// Reducer that combines partial results by multiplication; partial results
/// are seeded with T(1).
template <typename T>
struct MultReducer
{
   /// Type of the partial results being combined.
   using value_type = T;

   /// Seed @a a with the multiplicative identity T(1).
   static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
   {
      a = T(1);
   }

   /// Fold the partial result @a b into @a a.
   static MFEM_HOST_DEVICE void Join(value_type &a, const value_type &b) { a *= b; }
};


/// @brief a &= b
///
/// Bitwise-AND reducer. Only integral types are accepted (enforced at compile
/// time), since bitwise operators are not defined for floating point types.
template <typename T>
struct BAndReducer
{
   static_assert(std::is_integral<T>::value, "Only works for integral types");

   /// Type of the partial results being combined.
   using value_type = T;

   /// Seed @a a with the identity of bitwise AND, i.e. a value with all bits
   /// set.
   static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
   {
      // Complementing an all-zero value sets every bit. This would not work
      // for floating point types, but those are rejected by the static_assert.
      a = ~T(0);
   }

   /// Fold the partial result @a b into @a a.
   static MFEM_HOST_DEVICE void Join(value_type &a, const value_type &b) { a &= b; }
};


/// @brief a |= b
///
/// Bitwise-OR reducer. Only integral types are accepted (enforced at compile
/// time).
template <typename T>
struct BOrReducer
{
   static_assert(std::is_integral<T>::value, "Only works for integral types");

   /// Type of the partial results being combined.
   using value_type = T;

   /// Seed @a a with the identity of bitwise OR, i.e. a value with no bit set.
   static MFEM_HOST_DEVICE void SetInitialValue(T &a)
   {
      a = T(0);
   }

   /// Fold the partial result @a b into @a a.
   static MFEM_HOST_DEVICE void Join(value_type &a, const value_type &b) { a |= b; }
};


/// @brief a = min(a,b)
///
/// Generic version: values are compared with operator< and partial results are
/// seeded with std::numeric_limits<T>::max().
template <typename T>
struct MinReducer
{
   /// Type of the partial results being combined.
   using value_type = T;

   // Calling std::numeric_limits<T>::max() directly inside a host-device
   // method makes Cuda complain about host-only constexpr functions in device
   // code (unless --expt-relaxed-constexpr is given). Caching the value in a
   // constant works around that warning.
   static constexpr T max_val = std::numeric_limits<T>::max();

   /// Seed @a a with the largest value of T, so any candidate can replace it.
   static MFEM_HOST_DEVICE void SetInitialValue(value_type &a) { a = max_val; }

   /// Replace @a a by @a b when @a b is strictly smaller.
   static MFEM_HOST_DEVICE void Join(value_type &a, value_type b)
   {
      if (b < a) { a = b; }
   }
};


/// @brief a = min(a,b), specialization for float.
///
/// Values are combined with fmin and partial results are seeded with
/// HUGE_VALF.
template <>
struct MinReducer<float>
{
   /// Type of the partial results being combined.
   using value_type = float;

   /// Seed @a a with HUGE_VALF.
   static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
   {
      a = HUGE_VALF;
   }

   /// Store the smaller of @a a and @a b (as decided by fmin) in @a a.
   static MFEM_HOST_DEVICE void Join(value_type &a, value_type b)
   {
      const value_type smaller = fmin(a, b);
      a = smaller;
   }
};


/// @brief a = min(a,b), specialization for double.
///
/// Values are combined with fmin and partial results are seeded with
/// HUGE_VAL.
template <>
struct MinReducer<double>
{
   /// Type of the partial results being combined.
   using value_type = double;

   /// Seed @a a with HUGE_VAL.
   static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
   {
      a = HUGE_VAL;
   }

   /// Store the smaller of @a a and @a b (as decided by fmin) in @a a.
   static MFEM_HOST_DEVICE void Join(value_type &a, value_type b)
   {
      const value_type smaller = fmin(a, b);
      a = smaller;
   }
};


/// @brief a = max(a,b)
///
/// Generic version: values are compared with operator< and partial results are
/// seeded with std::numeric_limits<T>::lowest().
template <class T> struct MaxReducer
{
   /// Type of the partial results being combined.
   using value_type = T;

   /// Replace @a a by @a b when @a a is strictly smaller than @a b.
   static MFEM_HOST_DEVICE void Join(value_type &a, value_type b)
   {
      if (a < b)
      {
         a = b;
      }
   }

   // If we use std::numeric_limits<T>::lowest() in host-device method, Cuda
   // complains about calling host-only constexpr functions in device code
   // without --expt-relaxed-constexpr, so we define the following constant as a
   // workaround for the Cuda warning.
   //
   // lowest() rather than min() is required here: for floating point types
   // min() is the smallest *positive* normalized value, which would make the
   // maximum of an all-negative sequence come out wrong. For integral types
   // lowest() and min() are the same value.
   static constexpr T min_val = std::numeric_limits<T>::lowest();

   /// Seed @a a with the lowest value of T, so any candidate can replace it.
   static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
   {
      a = min_val;
   }

};


/// @brief a = max(a,b), specialization for float.
///
/// Values are combined with fmax and partial results are seeded with
/// -HUGE_VALF.
template <>
struct MaxReducer<float>
{
   /// Type of the partial results being combined.
   using value_type = float;

   /// Seed @a a with -HUGE_VALF.
   static MFEM_HOST_DEVICE void SetInitialValue(value_type &a) { a = -HUGE_VALF; }

   /// Store the larger of @a a and @a b (as decided by fmax) in @a a.
   static MFEM_HOST_DEVICE void Join(value_type &a, value_type b)
   {
      const value_type larger = fmax(a, b);
      a = larger;
   }
};


/// @brief a = max(a,b), specialization for double.
///
/// Values are combined with fmax and partial results are seeded with
/// -HUGE_VAL.
template <>
struct MaxReducer<double>
{
   /// Type of the partial results being combined.
   using value_type = double;

   /// Seed @a a with -HUGE_VAL.
   static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
   {
      a = -HUGE_VAL;
   }

   /// Store the larger of @a a and @a b (as decided by fmax) in @a a.
   static MFEM_HOST_DEVICE void Join(value_type &a, value_type b)
   {
      const value_type larger = fmax(a, b);
      a = larger;
   }
};


/// @brief a = minmax(a,b)
///
/// Tracks a running minimum in `first` and a running maximum in `second` of a
/// DevicePair<T, T>. Generic version: values are compared with operator< and
/// operator>.
template <class T> struct MinMaxReducer
{
   /// Partial result: {minimum so far, maximum so far}.
   using value_type = DevicePair<T, T>;

   /// Merge the partial result @a b into @a a.
   static MFEM_HOST_DEVICE void Join(value_type &a, const value_type &b)
   {
      if (b.first < a.first)
      {
         a.first = b.first;
      }
      if (b.second > a.second)
      {
         a.second = b.second;
      }
   }

   // If we use std::numeric_limits<T>::lowest() (or max()) in host-device
   // method, Cuda complains about calling host-only constexpr functions in
   // device code without --expt-relaxed-constexpr, so we define the following
   // constants as a workaround for the Cuda warning.
   //
   // min_val seeds the running maximum, so it has to be lowest(): for floating
   // point types min() is the smallest *positive* normalized value and would
   // hide every negative entry. For integral types both are the same value.
   static constexpr T min_val = std::numeric_limits<T>::lowest();
   static constexpr T max_val = std::numeric_limits<T>::max();

   /// Seed @a a so that any candidate replaces both the minimum and the
   /// maximum: {max_val, min_val}.
   static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
   {
      a = value_type{max_val, min_val};
   }

};


/// @brief a = minmax(a,b), specialization for float.
///
/// `first` holds the running minimum (combined with fmin), `second` the
/// running maximum (combined with fmax).
template <>
struct MinMaxReducer<float>
{
   /// Partial result: {minimum so far, maximum so far}.
   using value_type = DevicePair<float, float>;

   /// Seed @a a with {HUGE_VALF, -HUGE_VALF}.
   static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
   {
      a = value_type{HUGE_VALF, -HUGE_VALF};
   }

   /// Merge the partial result @a b into @a a.
   static MFEM_HOST_DEVICE void Join(value_type &a, value_type b)
   {
      const float lo = fmin(a.first, b.first);
      const float hi = fmax(a.second, b.second);
      a.first = lo;
      a.second = hi;
   }
};


/// @brief a = minmax(a,b), specialization for double.
///
/// `first` holds the running minimum (combined with fmin), `second` the
/// running maximum (combined with fmax).
template <>
struct MinMaxReducer<double>
{
   /// Partial result: {minimum so far, maximum so far}.
   using value_type = DevicePair<double, double>;

   /// Seed @a a with {HUGE_VAL, -HUGE_VAL}.
   static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
   {
      a = value_type{HUGE_VAL, -HUGE_VAL};
   }

   /// Merge the partial result @a b into @a a.
   static MFEM_HOST_DEVICE void Join(value_type &a, value_type b)
   {
      const double lo = fmin(a.first, b.first);
      const double hi = fmax(a.second, b.second);
      a.first = lo;
      a.second = hi;
   }
};


/// @brief i = argmin(a[i], a[j])
///
/// Partial results are {value, index} pairs. Note: for ties the returned index
/// can correspond to any min entry, not necessarily the first one.
template <typename T, typename I>
struct ArgMinReducer
{
   /// Partial result: {smallest value so far, its index}.
   using value_type = DevicePair<T, I>;

   /// Seed @a a with {largest value of T, index 0}.
   static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
   {
      // Cuda complains about calling host-only constexpr functions in device
      // code without --expt-relaxed-constexpr; routing the value through
      // integral_constant gets around this.
      using largest = std::integral_constant<T, std::numeric_limits<T>::max()>;
      a = value_type{largest::value, I{0}};
   }

   /// Take @a b (value and index) whenever its value is not larger than the
   /// one held by @a a.
   static MFEM_HOST_DEVICE void Join(value_type &a, const value_type &b)
   {
      if (b.first <= a.first) { a = b; }
   }
};


/// @brief i = argmin(a[i], a[j]), specialization for float values.
///
/// Partial results are {value, index} pairs seeded with {HUGE_VALF, 0}.
template <typename I>
struct ArgMinReducer<float, I>
{
   /// Partial result: {smallest value so far, its index}.
   using value_type = DevicePair<float, I>;

   /// Seed @a a with {HUGE_VALF, index 0}.
   static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
   {
      a = value_type{HUGE_VALF, I{0}};
   }

   /// Take @a b (value and index) whenever its value is not larger than the
   /// one held by @a a.
   static MFEM_HOST_DEVICE void Join(value_type &a, const value_type &b)
   {
      if (b.first <= a.first) { a = b; }
   }
};


/// @brief i = argmin(a[i], a[j]), specialization for double values.
///
/// Partial results are {value, index} pairs seeded with {HUGE_VAL, 0}.
template <typename I>
struct ArgMinReducer<double, I>
{
   /// Partial result: {smallest value so far, its index}.
   using value_type = DevicePair<double, I>;

   /// Seed @a a with {HUGE_VAL, index 0}.
   static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
   {
      a = value_type{HUGE_VAL, I{0}};
   }

   /// Take @a b (value and index) whenever its value is not larger than the
   /// one held by @a a.
   static MFEM_HOST_DEVICE void Join(value_type &a, const value_type &b)
   {
      if (b.first <= a.first) { a = b; }
   }
};


/// @brief i = argmax(a[i], a[j])
///
/// Partial results are {value, index} pairs. Note: for ties the returned index
/// can correspond to any max entry, not necessarily the first one.
template <class T, class I> struct ArgMaxReducer
{
   /// Partial result: {largest value so far, its index}.
   using value_type = DevicePair<T, I>;

   /// Take @a b (value and index) whenever its value is not smaller than the
   /// one held by @a a.
   static MFEM_HOST_DEVICE void Join(value_type &a, const value_type &b)
   {
      if (a.first <= b.first)
      {
         a = b;
      }
   }

   /// Seed @a a with {lowest value of T, index 0}.
   static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
   {
      // The seed of a max-reduction must be the LOWEST representable value so
      // that every candidate can replace it. Seeding with max() would make the
      // seed win against every candidate that is not itself equal to max().
      //
      // Cuda complains about calling host-only constexpr functions in device
      // code without --expt-relaxed-constexpr, wrap into integral_constant to
      // get around this
      a = value_type
      {
         std::integral_constant<T, std::numeric_limits<T>::lowest()>::value, I{0}};
   }

};


/// @brief i = argmax(a[i], a[j]), specialization for float values.
///
/// Partial results are {value, index} pairs seeded with {-HUGE_VALF, 0}.
template <typename I>
struct ArgMaxReducer<float, I>
{
   /// Partial result: {largest value so far, its index}.
   using value_type = DevicePair<float, I>;

   /// Seed @a a with {-HUGE_VALF, index 0}.
   static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
   {
      a = value_type{-HUGE_VALF, I{0}};
   }

   /// Take @a b (value and index) whenever its value is not smaller than the
   /// one held by @a a.
   static MFEM_HOST_DEVICE void Join(value_type &a, const value_type &b)
   {
      if (a.first <= b.first) { a = b; }
   }
};


/// @brief i = argmax(a[i], a[j]), specialization for double values.
///
/// Partial results are {value, index} pairs seeded with {-HUGE_VAL, 0}.
template <typename I>
struct ArgMaxReducer<double, I>
{
   /// Partial result: {largest value so far, its index}.
   using value_type = DevicePair<double, I>;

   /// Seed @a a with {-HUGE_VAL, index 0}.
   static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
   {
      a = value_type{-HUGE_VAL, I{0}};
   }

   /// Take @a b (value and index) whenever its value is not smaller than the
   /// one held by @a a.
   static MFEM_HOST_DEVICE void Join(value_type &a, const value_type &b)
   {
      if (a.first <= b.first) { a = b; }
   }
};


/// @brief Simultaneous argmin and argmax: tracks the smallest and the largest
/// value together with the location index of each.
///
/// Note: for ties the returned indices can correspond to any min (resp. max)
/// entry, not necessarily the first one.
template <class T, class I> struct ArgMinMaxReducer
{
   /// Partial result: {min value, max value, min location, max location}.
   using value_type = MinMaxLocScalar<T, I>;

   /// Merge the partial result @a b into @a a. The min and max halves are
   /// updated independently of each other.
   static MFEM_HOST_DEVICE void Join(value_type &a, const value_type &b)
   {
      if (b.min_val <= a.min_val)
      {
         a.min_val = b.min_val;
         a.min_loc = b.min_loc;
      }
      if (b.max_val >= a.max_val)
      {
         a.max_val = b.max_val;
         a.max_loc = b.max_loc;
      }
   }

   /// Seed @a a with {largest value of T, lowest value of T, 0, 0} so that any
   /// candidate replaces both halves.
   static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
   {
      // The running maximum is seeded with lowest(), not min(): the two agree
      // for integral T, but min() would be the smallest positive value if T
      // were a floating point type.
      //
      // Cuda complains about calling host-only constexpr functions in device
      // code without --expt-relaxed-constexpr, wrap into integral_constant to
      // get around this
      a = value_type
      {
         std::integral_constant<T, std::numeric_limits<T>::max()>::value,
         std::integral_constant<T, std::numeric_limits<T>::lowest()>::value,
         I(0), I(0)};
   }

};


/// @brief Simultaneous argmin and argmax, specialization for float values.
///
/// Partial results are seeded with {HUGE_VALF, -HUGE_VALF, 0, 0}.
template <typename I>
struct ArgMinMaxReducer<float, I>
{
   /// Partial result: {min value, max value, min location, max location}.
   using value_type = MinMaxLocScalar<float, I>;

   /// Seed @a a with {HUGE_VALF, -HUGE_VALF, index 0, index 0}.
   static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
   {
      a = value_type{HUGE_VALF, -HUGE_VALF, I(0), I(0)};
   }

   /// Merge the partial result @a b into @a a. The max and min halves are
   /// updated independently of each other.
   static MFEM_HOST_DEVICE void Join(value_type &a, const value_type &b)
   {
      // max half: take b when its maximum is not smaller
      if (b.max_val >= a.max_val)
      {
         a.max_loc = b.max_loc;
         a.max_val = b.max_val;
      }
      // min half: take b when its minimum is not larger
      if (b.min_val <= a.min_val)
      {
         a.min_loc = b.min_loc;
         a.min_val = b.min_val;
      }
   }
};


/// @brief Simultaneous argmin and argmax, specialization for double values.
///
/// Partial results are seeded with {HUGE_VAL, -HUGE_VAL, 0, 0}.
template <typename I>
struct ArgMinMaxReducer<double, I>
{
   /// Partial result: {min value, max value, min location, max location}.
   using value_type = MinMaxLocScalar<double, I>;

   /// Seed @a a with {HUGE_VAL, -HUGE_VAL, index 0, index 0}.
   static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
   {
      a = value_type{HUGE_VAL, -HUGE_VAL, I(0), I(0)};
   }

   /// Merge the partial result @a b into @a a. The max and min halves are
   /// updated independently of each other.
   static MFEM_HOST_DEVICE void Join(value_type &a, const value_type &b)
   {
      // max half: take b when its maximum is not smaller
      if (b.max_val >= a.max_val)
      {
         a.max_loc = b.max_loc;
         a.max_val = b.max_val;
      }
      // min half: take b when its minimum is not larger
      if (b.min_val <= a.min_val)
      {
         a.min_loc = b.min_loc;
         a.min_val = b.min_val;
      }
   }
};


namespace internal

{


/**
 @brief Device portion of a reduction over a 1D sequence [0, N)
 @tparam B Reduction body. Must be callable with the signature
 void(int i, value_type& v), where i is the index to evaluate and v is the
 value to update.
 @tparam R Reducer capable of combining values of type value_type. See
 reducers.hpp for pre-defined reducers.

 The data members are initialized positionally (aggregate initialization) by
 reduce(), so their declaration order must not change.
 */
template<class B, class R> struct reduction_kernel
{
   /// value type body and reducer operate on.
   using value_type = typename R::value_type;
   /// workspace for the intermediate reduction results; entry `work_idx`
   /// receives the result of the block invoked with that index.
   mutable value_type *work;
   /// Reduction body, invoked as body(i, value).
   B body;
   /// Reducer used to seed and to join the per-thread partial results.
   R reducer;
   /// Length of sequence to reduce over.
   int N;
   /// How many items is each thread responsible for during the serial phase
   int items_per_thread;

   /// Upper bound on the number of threads per block; also the size of the
   /// per-block scratch buffer used by operator().
   constexpr static MFEM_HOST_DEVICE int max_blocksize() { return 256; }

   /// @brief helper for computing the reduction block size
   ///
   /// @return the number of significant bits of @a N, i.e. floor(log2(N)) + 1
   /// for N > 0 and 0 for N == 0.
   static int block_log2(unsigned N)
   {
#if defined(__GNUC__) || defined(__clang__)
      // __builtin_clz is undefined for 0, hence the explicit guard.
      return N ? static_cast<int>(sizeof(unsigned) * 8) - __builtin_clz(N) : 0;
#else
      // Portable fallback (also used with MSVC): count how many right shifts
      // it takes to clear N. This runs once per reduction, on the host, so
      // the loop cost is irrelevant.
      int res = 0;
      while (N)
      {
         N >>= 1;
         ++res;
      }
      return res;
#endif
   }

   /// @brief Reduce the slice of [0, N) assigned to block @a work_idx and
   /// store the block result in work[work_idx].
   MFEM_HOST_DEVICE void operator()(int work_idx) const
   {
      // one slot per thread of the block
      MFEM_SHARED value_type buffer[max_blocksize()];
      reducer.SetInitialValue(buffer[MFEM_THREAD_ID(x)]);
      // serial part: each thread folds up to items_per_thread entries into its
      // own slot; consecutive threads visit consecutive indices.
      for (int idx = 0; idx < items_per_thread; ++idx)
      {
         int i = MFEM_THREAD_ID(x) +
                 (idx + work_idx * items_per_thread) * MFEM_THREAD_SIZE(x);
         if (i < N)
         {
            body(i, buffer[MFEM_THREAD_ID(x)]);
         }
         else
         {
            // indices only grow with idx, nothing left for this thread
            break;
         }
      }
      // binary tree reduction: halve the number of active slots each round.
      // Every slot is only visited when the thread count is a power of two,
      // which is how reduce() chooses the block size.
      for (int i = (MFEM_THREAD_SIZE(x) >> 1); i > 0; i >>= 1)
      {
         // make the writes of the previous round (or of the serial part)
         // visible before reading a neighbour's slot
         MFEM_SYNC_THREAD;
         if (MFEM_THREAD_ID(x) < i)
         {
            reducer.Join(buffer[MFEM_THREAD_ID(x)], buffer[MFEM_THREAD_ID(x) + i]);
         }
      }
      // thread 0 performed the last join itself, so slot 0 is final here
      if (MFEM_THREAD_ID(x) == 0)
      {
         work[work_idx] = buffer[0];
      }
   }
};

}


/**
 @brief Performs a 1D reduction on the range [0,N).
 @tparam T value_type to operate on
 @tparam B type of the reduction body, callable as body(int i, T &value)
 @tparam R type of the reducer; must provide Join() for values of type T
 @param[in] N length of the range; nothing is done when N <= 0.
 @param[in,out] res initial value and where the result will be written.
 @param[in] body reduction function body.
 @param[in] reducer helper for joining two reduced values.
 @param[in] use_dev true to perform the reduction on the device, if possible.
 @param[in,out] workspace temporary workspace used for device reductions. May
 be resized to a larger capacity as needed. Preferably should have
 MemoryType::MANAGED or MemoryType::HOST_PINNED. TODO: replace with internal
 temporary workspace vectors once that's added to the memory manager.
 */
template <class T, class B, class R>
void reduce(int N, T &res, B &&body, const R &reducer, bool use_dev,
            Array<T> &workspace)
{
   // Empty (or invalid, negative) range: leave res untouched.
   if (N <= 0)
   {
      return;
   }

#if defined(MFEM_USE_CUDA_OR_HIP)
   if (use_dev &&
       mfem::Device::Allows(Backend::CUDA | Backend::HIP | Backend::RAJA_CUDA |
                            Backend::RAJA_HIP))
   {
      using red_type = internal::reduction_kernel<typename std::decay<B>::type,
            typename std::decay<R>::type>;
      // max block size is 256, but can be smaller. The block size is always a
      // power of two, as required by the tree reduction in the kernel.
      // The clamp is done in 64-bit: for N >= 2^30 the power of two is 2^31,
      // which does not fit in an int and must not be narrowed before the min.
      const int block_size = static_cast<int>(
                                std::min<long long>(red_type::max_blocksize(),
                                                    1ll << red_type::block_log2(N)));

      int num_mp = Device::NumMultiprocessors(Device::GetId());
#if defined(MFEM_USE_CUDA)
      // good value of mp_sat found experimentally on Lassen
      constexpr int mp_sat = 8;
#elif defined(MFEM_USE_HIP)
      // good value of mp_sat found experimentally on Tuolumne
      constexpr int mp_sat = 4;
#else
      num_mp = 1;
      constexpr int mp_sat = 1;
#endif
      // determine how many items each thread should sum during the serial
      // portion. Both divisions round up; they are written as
      // (N - 1) / d + 1 (valid since N >= 1) so that the numerator cannot
      // overflow when N is close to INT_MAX.
      const int nblocks = std::min(mp_sat * num_mp, (N - 1) / block_size + 1);
      const int items_per_thread = (N - 1) / (block_size * nblocks) + 1;

      red_type red{nullptr, std::forward<B>(body), reducer, N, items_per_thread};
      // size the workspace to hold one partial result per block, in memory
      // that is pinned or managed
      auto mt = workspace.GetMemory().GetMemoryType();
      if (mt != MemoryType::HOST_PINNED && mt != MemoryType::MANAGED)
      {
         mt = MemoryType::HOST_PINNED;
      }
      workspace.SetSize(nblocks, mt);
      auto work = workspace.HostWrite();
      red.work = work;
      forall_2D(nblocks, block_size, 1, std::move(red));
      // wait for results
      MFEM_DEVICE_SYNC;
      // fold the per-block partial results into the caller's value
      for (int i = 0; i < nblocks; ++i)
      {
         reducer.Join(res, work[i]);
      }
      return;
   }
#endif

   // host fallback: plain serial loop accumulating directly into res
   for (int i = 0; i < N; ++i)
   {
      body(i, res);
   }
}


} // namespace mfem


#endif // MFEM_REDUCERS_HPP

array.hpp

mfem::Array
Definition array.hpp:48

mfem::Array::GetMemory
Memory< T > & GetMemory()
Return a reference to the Memory object used by the Array.
Definition array.hpp:145

mfem::Array::SetSize
void SetSize(int nsize)
Change the logical size of the array, keep existing entries.
Definition array.hpp:840

mfem::Array::HostWrite
T * HostWrite()
Shortcut for mfem::Write(a.GetMemory(), a.Size(), false).
Definition array.hpp:393

mfem::Device::NumMultiprocessors
static int NumMultiprocessors()
Same as NumMultiprocessors(int), for the currently active device.
Definition device.cpp:736

mfem::Device::Allows
static bool Allows(unsigned long b_mask)
Return true if any of the backends in the backend mask, b_mask, are allowed.
Definition device.hpp:262

mfem::Device::GetId
static int GetId()
Get the device ID of the configured device.
Definition device.hpp:253

forall.hpp

b
real_t b
Definition lissajous.cpp:42

a
real_t a
Definition lissajous.cpp:41

mfem
Definition CodeDocumentation.dox:1

mfem::reduce
void reduce(int N, T &res, B &&body, const R &reducer, bool use_dev, Array< T > &workspace)
Performs a 1D reduction on the range [0,N). res initial value and where the result will be written....
Definition reducers.hpp:532

mfem::forall_2D
void forall_2D(int N, int X, int Y, lambda &&body)
Definition forall.hpp:925

mfem::MemoryType::HOST_PINNED
@ HOST_PINNED
Host memory: pinned (page-locked)

mfem::MemoryType::MANAGED
@ MANAGED

mfem::ArgMaxReducer< double, I >::SetInitialValue
static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
Definition reducers.hpp:359

mfem::ArgMaxReducer< double, I >::Join
static MFEM_HOST_DEVICE void Join(value_type &a, const value_type &b)
Definition reducers.hpp:352

mfem::ArgMaxReducer< float, I >::Join
static MFEM_HOST_DEVICE void Join(value_type &a, const value_type &b)
Definition reducers.hpp:336

mfem::ArgMaxReducer< float, I >::SetInitialValue
static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
Definition reducers.hpp:343

mfem::ArgMaxReducer
i = argmax(a[i], a[j])
Definition reducers.hpp:313

mfem::ArgMaxReducer::Join
static MFEM_HOST_DEVICE void Join(value_type &a, const value_type &b)
Definition reducers.hpp:315

mfem::ArgMaxReducer::SetInitialValue
static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
Definition reducers.hpp:322

mfem::ArgMinMaxReducer< double, I >::Join
static MFEM_HOST_DEVICE void Join(value_type &a, const value_type &b)
Definition reducers.hpp:421

mfem::ArgMinMaxReducer< double, I >::SetInitialValue
static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
Definition reducers.hpp:435

mfem::ArgMinMaxReducer< float, I >::Join
static MFEM_HOST_DEVICE void Join(value_type &a, const value_type &b)
Definition reducers.hpp:398

mfem::ArgMinMaxReducer< float, I >::SetInitialValue
static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
Definition reducers.hpp:412

mfem::ArgMinMaxReducer
Definition reducers.hpp:366

mfem::ArgMinMaxReducer::SetInitialValue
static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
Definition reducers.hpp:382

mfem::ArgMinMaxReducer::Join
static MFEM_HOST_DEVICE void Join(value_type &a, const value_type &b)
Definition reducers.hpp:368

mfem::ArgMinReducer< double, I >::Join
static MFEM_HOST_DEVICE void Join(value_type &a, const value_type &b)
Definition reducers.hpp:295

mfem::ArgMinReducer< double, I >::SetInitialValue
static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
Definition reducers.hpp:302

mfem::ArgMinReducer< float, I >::SetInitialValue
static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
Definition reducers.hpp:286

mfem::ArgMinReducer< float, I >::Join
static MFEM_HOST_DEVICE void Join(value_type &a, const value_type &b)
Definition reducers.hpp:279

mfem::ArgMinReducer
i = argmin(a[i], a[j])
Definition reducers.hpp:256

mfem::ArgMinReducer::SetInitialValue
static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
Definition reducers.hpp:265

mfem::ArgMinReducer::Join
static MFEM_HOST_DEVICE void Join(value_type &a, const value_type &b)
Definition reducers.hpp:258

mfem::BAndReducer
a &= b
Definition reducers.hpp:67

mfem::BAndReducer::Join
static MFEM_HOST_DEVICE void Join(value_type &a, const value_type &b)
Definition reducers.hpp:70

mfem::BAndReducer::value_type
T value_type
Definition reducers.hpp:69

mfem::BAndReducer::SetInitialValue
static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
Definition reducers.hpp:75

mfem::BOrReducer
a |= b
Definition reducers.hpp:85

mfem::BOrReducer::Join
static MFEM_HOST_DEVICE void Join(value_type &a, const value_type &b)
Definition reducers.hpp:88

mfem::BOrReducer::SetInitialValue
static MFEM_HOST_DEVICE void SetInitialValue(T &a)
Definition reducers.hpp:93

mfem::BOrReducer::value_type
T value_type
Definition reducers.hpp:87

mfem::Backend::RAJA_CUDA
@ RAJA_CUDA
[device] RAJA CUDA backend. Enabled when MFEM_USE_RAJA = YES and MFEM_USE_CUDA = YES.
Definition device.hpp:51

mfem::Backend::HIP
@ HIP
[device] HIP backend. Enabled when MFEM_USE_HIP = YES.
Definition device.hpp:42

mfem::Backend::RAJA_HIP
@ RAJA_HIP
[device] RAJA HIP backend. Enabled when MFEM_USE_RAJA = YES and MFEM_USE_HIP = YES.
Definition device.hpp:54

mfem::Backend::CUDA
@ CUDA
[device] CUDA backend. Enabled when MFEM_USE_CUDA = YES.
Definition device.hpp:40

mfem::DevicePair
Pair of values which can be used in device code.
Definition reducers.hpp:27

mfem::DevicePair::second
B second
Definition reducers.hpp:29

mfem::DevicePair::first
A first
Definition reducers.hpp:28

mfem::MaxReducer< double >::value_type
double value_type
Definition reducers.hpp:183

mfem::MaxReducer< double >::Join
static MFEM_HOST_DEVICE void Join(value_type &a, value_type b)
Definition reducers.hpp:184

mfem::MaxReducer< double >::SetInitialValue
static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
Definition reducers.hpp:189

mfem::MaxReducer< float >::Join
static MFEM_HOST_DEVICE void Join(value_type &a, value_type b)
Definition reducers.hpp:170

mfem::MaxReducer< float >::value_type
float value_type
Definition reducers.hpp:169

mfem::MaxReducer< float >::SetInitialValue
static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
Definition reducers.hpp:175

mfem::MaxReducer
a = max(a,b)
Definition reducers.hpp:145

mfem::MaxReducer::Join
static MFEM_HOST_DEVICE void Join(value_type &a, value_type b)
Definition reducers.hpp:147

mfem::MaxReducer::SetInitialValue
static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
Definition reducers.hpp:161

mfem::MaxReducer::value_type
T value_type
Definition reducers.hpp:146

mfem::MaxReducer::min_val
static constexpr T min_val
Definition reducers.hpp:159

mfem::MinMaxLocScalar
Two pairs for the min/max values and their location indices.
Definition reducers.hpp:34

mfem::MinMaxLocScalar::max_loc
B max_loc
Definition reducers.hpp:38

mfem::MinMaxLocScalar::max_val
A max_val
Definition reducers.hpp:36

mfem::MinMaxLocScalar::min_loc
B min_loc
Definition reducers.hpp:37

mfem::MinMaxLocScalar::min_val
A min_val
Definition reducers.hpp:35

mfem::MinMaxReducer< double >::SetInitialValue
static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
Definition reducers.hpp:245

mfem::MinMaxReducer< double >::Join
static MFEM_HOST_DEVICE void Join(value_type &a, value_type b)
Definition reducers.hpp:239

mfem::MinMaxReducer< float >::Join
static MFEM_HOST_DEVICE void Join(value_type &a, value_type b)
Definition reducers.hpp:224

mfem::MinMaxReducer< float >::SetInitialValue
static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
Definition reducers.hpp:230

mfem::MinMaxReducer
a = minmax(a,b)
Definition reducers.hpp:194

mfem::MinMaxReducer::Join
static MFEM_HOST_DEVICE void Join(value_type &a, const value_type &b)
Definition reducers.hpp:196

mfem::MinMaxReducer::SetInitialValue
static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
Definition reducers.hpp:215

mfem::MinMaxReducer::max_val
static constexpr T max_val
Definition reducers.hpp:213

mfem::MinMaxReducer::min_val
static constexpr T min_val
Definition reducers.hpp:212

mfem::MinReducer< double >::Join
static MFEM_HOST_DEVICE void Join(value_type &a, value_type b)
Definition reducers.hpp:135

mfem::MinReducer< double >::SetInitialValue
static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
Definition reducers.hpp:140

mfem::MinReducer< double >::value_type
double value_type
Definition reducers.hpp:134

mfem::MinReducer< float >::Join
static MFEM_HOST_DEVICE void Join(value_type &a, value_type b)
Definition reducers.hpp:124

mfem::MinReducer< float >::SetInitialValue
static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
Definition reducers.hpp:129

mfem::MinReducer< float >::value_type
float value_type
Definition reducers.hpp:123

mfem::MinReducer
a = min(a,b)
Definition reducers.hpp:98

mfem::MinReducer::Join
static MFEM_HOST_DEVICE void Join(value_type &a, value_type b)
Definition reducers.hpp:101

mfem::MinReducer::max_val
static constexpr T max_val
Definition reducers.hpp:113

mfem::MinReducer::SetInitialValue
static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
Definition reducers.hpp:115

mfem::MinReducer::value_type
T value_type
Definition reducers.hpp:99

mfem::MultReducer
a *= b
Definition reducers.hpp:55

mfem::MultReducer::SetInitialValue
static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
Definition reducers.hpp:62

mfem::MultReducer::Join
static MFEM_HOST_DEVICE void Join(value_type &a, const value_type &b)
Definition reducers.hpp:57

mfem::MultReducer::value_type
T value_type
Definition reducers.hpp:56

mfem::SumReducer
a += b
Definition reducers.hpp:43

mfem::SumReducer::Join
static MFEM_HOST_DEVICE void Join(value_type &a, const value_type &b)
Definition reducers.hpp:45

mfem::SumReducer::value_type
T value_type
Definition reducers.hpp:44

mfem::SumReducer::SetInitialValue
static MFEM_HOST_DEVICE void SetInitialValue(value_type &a)
Definition reducers.hpp:50