4.0/cuda_8hpp_source.html

 // Copyright (c) 2010, Lawrence Livermore National Security, LLC. Produced at

 // the Lawrence Livermore National Laboratory. LLNL-CODE-443211. All Rights

 // reserved. See file COPYRIGHT for details.

 //

 // This file is part of the MFEM library. For more information and source code

 // availability see http://mfem.org.

 //

 // MFEM is free software; you can redistribute it and/or modify it under the

 // terms of the GNU Lesser General Public License (as published by the Free

 // Software Foundation) version 2.1 dated February 1999.


 #ifndef MFEM_CUDA_HPP

 #define MFEM_CUDA_HPP


 #include "../config/config.hpp"

 #include "error.hpp"


 #ifdef MFEM_USE_CUDA

 #include <cuda_runtime.h>

 #include <cuda.h>

 #endif


 // CUDA block size used by MFEM.
 // NOTE(review): presumably the number of threads per CUDA block used for
 // kernel launches (despite the plural "BLOCKS" in the name) -- confirm against
 // the launch wrappers. Defined whether or not MFEM_USE_CUDA is set.

 #define MFEM_CUDA_BLOCKS 256


 #ifdef MFEM_USE_CUDA
 // Function qualifiers: MFEM_DEVICE marks device-only code, MFEM_HOST_DEVICE
 // marks code compiled for both the host and the device.
 #define MFEM_DEVICE __device__
 #define MFEM_HOST_DEVICE __host__ __device__
 // Define a CUDA error check macro, MFEM_CUDA_CHECK(x), where x returns/is of
 // type 'cudaError_t'. This macro evaluates 'x' exactly once and raises an
 // error, through mfem::mfem_cuda_error, if the result is not cudaSuccess.
 //
 // Macro hygiene:
 //  - The temporary has a deliberately unusual name so that an argument
 //    expression mentioning a caller variable called 'err' (or the stream
 //    mfem::err) is not captured by the macro's own local.
 //  - The error handler is called with a fully qualified name so the macro can
 //    be used from code outside of namespace mfem.
 //  - The do { ... } while (0) wrapper makes the expansion a single statement
 //    that is safe inside unbraced if/else.
 #define MFEM_CUDA_CHECK(x) \
    do \
    { \
       const cudaError_t mfem_cuda_check_err_ = (x); \
       if (mfem_cuda_check_err_ != cudaSuccess) \
       { \
          ::mfem::mfem_cuda_error(mfem_cuda_check_err_, #x, _MFEM_FUNC_NAME, \
                                  __FILE__, __LINE__); \
       } \
    } \
    while (0)
 #else
 // Without CUDA the function qualifiers expand to nothing, so annotated code
 // compiles as ordinary host code. MFEM_CUDA_CHECK is not defined in this case.
 #define MFEM_DEVICE
 #define MFEM_HOST_DEVICE
 #endif // MFEM_USE_CUDA


 // Define the MFEM inner threading macros
 //
 // When compiling device code (MFEM_USE_CUDA defined and __CUDA_ARCH__ set)
 // the macros map onto the CUDA built-ins; in every other compilation pass
 // they collapse to a serial equivalent with a single "thread" of index 0.
 //
 //   MFEM_SHARED           storage qualifier (__shared__ or nothing)
 //   MFEM_SYNC_THREAD      __syncthreads() or nothing
 //   MFEM_THREAD_ID(k)     threadIdx.k or 0, with k one of x, y, z
 //   MFEM_THREAD_SIZE(k)   blockDim.k or 1
 //   MFEM_FOREACH_THREAD(i,k,N)
 //                         loop header declaring 'int i' and visiting
 //                         i = id, id + size, ... while i < N
 //
 // The bound N is parenthesized in the expansion so that expressions with
 // lower precedence than '<' (e.g. 'a & b' or 'c ? x : y') are compared as a
 // whole. N is re-evaluated on every iteration, like any loop condition.
 #if defined(MFEM_USE_CUDA) && defined(__CUDA_ARCH__)
 #define MFEM_SHARED __shared__
 #define MFEM_SYNC_THREAD __syncthreads()
 #define MFEM_THREAD_ID(k) threadIdx.k
 #define MFEM_THREAD_SIZE(k) blockDim.k
 #define MFEM_FOREACH_THREAD(i,k,N) for(int i=threadIdx.k; i<(N); i+=blockDim.k)
 #else
 #define MFEM_SHARED
 #define MFEM_SYNC_THREAD
 #define MFEM_THREAD_ID(k) 0
 #define MFEM_THREAD_SIZE(k) 1
 #define MFEM_FOREACH_THREAD(i,k,N) for(int i=0; i<(N); i++)
 #endif


 namespace mfem

 {


 #ifdef MFEM_USE_CUDA

 // Function used by the macro MFEM_CUDA_CHECK.
 // The macro passes: the failing cudaError_t value (err), the stringified
 // checked expression (expr), the enclosing function name (func), and the
 // source location (file, line). Only declared when MFEM_USE_CUDA is defined.

 void mfem_cuda_error(cudaError_t err, const char *expr, const char *func,

                      const char *file, int line);

 #endif


 // The memory helpers below are declared whether or not MFEM_USE_CUDA is
 // defined. NOTE(review): the meaning of the returned void* and the behavior
 // in non-CUDA builds are not visible in this header -- confirm in cuda.cpp.

 /// Allocates device memory
 /// (bytes is the requested size; presumably the resulting device address is
 /// stored through d_ptr -- TODO confirm)

 void* CuMemAlloc(void **d_ptr, size_t bytes);


 /// Frees device memory

 void* CuMemFree(void *d_ptr);


 /// Copies memory from Host to Device

 void* CuMemcpyHtoD(void *d_dst, const void *h_src, size_t bytes);


 /// Copies memory from Host to Device
 /// (asynchronous variant, judging by the name; NOTE(review): confirm which
 /// stream is used and when the copy is guaranteed complete)

 void* CuMemcpyHtoDAsync(void *d_dst, const void *h_src, size_t bytes);


 /// Copies memory from Device to Device

 void* CuMemcpyDtoD(void *d_dst, const void *d_src, size_t bytes);


 /// Copies memory from Device to Device
 /// (asynchronous variant, judging by the name; NOTE(review): confirm which
 /// stream is used and when the copy is guaranteed complete)

 void* CuMemcpyDtoDAsync(void *d_dst, const void *d_src, size_t bytes);


 /// Copies memory from Device to Host

 void* CuMemcpyDtoH(void *h_dst, const void *d_src, size_t bytes);


 /// Copies memory from Device to Host
 /// (asynchronous variant, judging by the name; NOTE(review): confirm which
 /// stream is used and when the copy is guaranteed complete)

 void* CuMemcpyDtoHAsync(void *h_dst, const void *d_src, size_t bytes);


 } // namespace mfem


 #endif // MFEM_CUDA_HPP

mfem::CuMemcpyHtoD
void * CuMemcpyHtoD(void *dst, const void *src, size_t bytes)
Copies memory from Host to Device.
Definition: cuda.cpp:64

mfem::CuMemFree
void * CuMemFree(void *dptr)
Frees device memory.
Definition: cuda.cpp:49

mfem::mfem_cuda_error
void mfem_cuda_error(cudaError_t err, const char *expr, const char *func, const char *file, int line)
Definition: cuda.cpp:23

mfem::CuMemcpyDtoD
void * CuMemcpyDtoD(void *dst, const void *src, size_t bytes)
Copies memory from Device to Device.
Definition: cuda.cpp:87

mfem::CuMemcpyDtoDAsync
void * CuMemcpyDtoDAsync(void *dst, const void *src, size_t bytes)
Copies memory from Device to Device.
Definition: cuda.cpp:102

mfem::err
OutStream err(std::cerr)
Global stream used by the library for standard error output. Initially it uses the same std::streambu...
Definition: globals.hpp:69

error.hpp

mfem::CuMemcpyDtoHAsync
void * CuMemcpyDtoHAsync(void *dst, const void *src, size_t bytes)
Copies memory from Device to Host.
Definition: cuda.cpp:125

mfem::CuMemcpyHtoDAsync
void * CuMemcpyHtoDAsync(void *dst, const void *src, size_t bytes)
Copies memory from Host to Device.
Definition: cuda.cpp:79

mfem::CuMemAlloc
void * CuMemAlloc(void **dptr, size_t bytes)
Allocates device memory.
Definition: cuda.cpp:34

mfem::CuMemcpyDtoH
void * CuMemcpyDtoH(void *dst, const void *src, size_t bytes)
Copies memory from Device to Host.
Definition: cuda.cpp:110