MFEM  v4.1.0
Finite element discretization library
 All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Pages
cuda.cpp
Go to the documentation of this file.
1 // Copyright (c) 2010-2020, Lawrence Livermore National Security, LLC. Produced
2 // at the Lawrence Livermore National Laboratory. All Rights reserved. See files
3 // LICENSE and NOTICE for details. LLNL-CODE-806117.
4 //
5 // This file is part of the MFEM library. For more information and source code
6 // availability visit https://mfem.org.
7 //
8 // MFEM is free software; you can redistribute it and/or modify it under the
9 // terms of the BSD-3 license. We welcome feedback and contributions, see file
10 // CONTRIBUTING.md for details.
11 
12 #include "cuda.hpp"
13 #include "globals.hpp"
14 
15 namespace mfem
16 {
17 
18 // Internal debug option, useful for tracking CUDA allocations, deallocations
19 // and transfers.
20 // #define MFEM_TRACK_CUDA_MEM
21 
22 #ifdef MFEM_USE_CUDA
23 void mfem_cuda_error(cudaError_t err, const char *expr, const char *func,
24  const char *file, int line)
25 {
26  mfem::err << "\n\nCUDA error: (" << expr << ") failed with error:\n --> "
27  << cudaGetErrorString(err)
28  << "\n ... in function: " << func
29  << "\n ... in file: " << file << ':' << line << '\n';
30  mfem_error();
31 }
32 #endif
33 
/// Allocate @a bytes of device memory with cudaMalloc; the device address is
/// stored in *dptr and also returned. Aborts via MFEM_GPU_CHECK on error.
/// Fix: in builds without MFEM_USE_CUDA the function used to return *dptr
/// without ever writing it (an indeterminate value); it now sets *dptr to
/// nullptr and returns that, so the no-CUDA path is well defined.
void* CuMemAlloc(void** dptr, size_t bytes)
{
#ifdef MFEM_USE_CUDA
#ifdef MFEM_TRACK_CUDA_MEM
   mfem::out << "CuMemAlloc(): allocating " << bytes << " bytes ... "
             << std::flush;
#endif
   MFEM_GPU_CHECK(cudaMalloc(dptr, bytes));
#ifdef MFEM_TRACK_CUDA_MEM
   mfem::out << "done: " << *dptr << std::endl;
#endif
#else
   *dptr = nullptr; // no CUDA backend: report a null allocation
#endif
   return *dptr;
}
48 
/// Allocate @a bytes of managed (unified) memory with cudaMallocManaged; the
/// address is stored in *dptr and also returned. Aborts via MFEM_GPU_CHECK on
/// error.
/// Fix: in builds without MFEM_USE_CUDA the function used to return *dptr
/// without ever writing it (an indeterminate value); it now sets *dptr to
/// nullptr and returns that, so the no-CUDA path is well defined.
void* CuMallocManaged(void** dptr, size_t bytes)
{
#ifdef MFEM_USE_CUDA
#ifdef MFEM_TRACK_CUDA_MEM
   mfem::out << "CuMallocManaged(): allocating " << bytes << " bytes ... "
             << std::flush;
#endif
   MFEM_GPU_CHECK(cudaMallocManaged(dptr, bytes));
#ifdef MFEM_TRACK_CUDA_MEM
   mfem::out << "done: " << *dptr << std::endl;
#endif
#else
   *dptr = nullptr; // no CUDA backend: report a null allocation
#endif
   return *dptr;
}
63 
// Free device memory previously obtained from CuMemAlloc()/CuMallocManaged()
// via cudaFree, returning the (now dangling) pointer that was passed in.
// A pure pass-through (no free) when MFEM is built without CUDA support.
// Aborts via MFEM_GPU_CHECK on error.
// NOTE(review): unlike the allocators, this takes void* rather than void**,
// so the caller's pointer variable is not nulled out here.
void* CuMemFree(void *dptr)
{
#ifdef MFEM_USE_CUDA
#ifdef MFEM_TRACK_CUDA_MEM
   // Optional allocation tracing, enabled by MFEM_TRACK_CUDA_MEM above.
   mfem::out << "CuMemFree(): deallocating memory @ " << dptr << " ... "
             << std::flush;
#endif
   MFEM_GPU_CHECK(cudaFree(dptr));
#ifdef MFEM_TRACK_CUDA_MEM
   mfem::out << "done." << std::endl;
#endif
#endif
   return dptr;
}
78 
// Copy 'bytes' bytes from host memory 'src' to device memory 'dst' with a
// blocking cudaMemcpy(..., cudaMemcpyHostToDevice); returns 'dst'.
// A no-op (still returning 'dst') when MFEM is built without CUDA support.
// Aborts via MFEM_GPU_CHECK on error.
void* CuMemcpyHtoD(void* dst, const void* src, size_t bytes)
{
#ifdef MFEM_USE_CUDA
#ifdef MFEM_TRACK_CUDA_MEM
   // Optional transfer tracing, enabled by MFEM_TRACK_CUDA_MEM above.
   mfem::out << "CuMemcpyHtoD(): copying " << bytes << " bytes from "
             << src << " to " << dst << " ... " << std::flush;
#endif
   MFEM_GPU_CHECK(cudaMemcpy(dst, src, bytes, cudaMemcpyHostToDevice));
#ifdef MFEM_TRACK_CUDA_MEM
   mfem::out << "done." << std::endl;
#endif
#endif
   return dst;
}
93 
// Asynchronous host-to-device copy of 'bytes' bytes from 'src' to 'dst';
// returns 'dst' without synchronizing. No stream argument is exposed, so the
// copy is issued on the default CUDA stream.
// NOTE(review): cudaMemcpyAsync may still behave synchronously when 'src' is
// pageable (non-pinned) host memory — confirm callers pin the host buffer
// when overlap is required.
void* CuMemcpyHtoDAsync(void* dst, const void* src, size_t bytes)
{
#ifdef MFEM_USE_CUDA
   MFEM_GPU_CHECK(cudaMemcpyAsync(dst, src, bytes, cudaMemcpyHostToDevice));
#endif
   return dst;
}
101 
// Copy 'bytes' bytes between two device buffers with a blocking
// cudaMemcpy(..., cudaMemcpyDeviceToDevice); returns 'dst'.
// A no-op (still returning 'dst') when MFEM is built without CUDA support.
// Aborts via MFEM_GPU_CHECK on error.
void* CuMemcpyDtoD(void *dst, const void *src, size_t bytes)
{
#ifdef MFEM_USE_CUDA
#ifdef MFEM_TRACK_CUDA_MEM
   // Optional transfer tracing, enabled by MFEM_TRACK_CUDA_MEM above.
   mfem::out << "CuMemcpyDtoD(): copying " << bytes << " bytes from "
             << src << " to " << dst << " ... " << std::flush;
#endif
   MFEM_GPU_CHECK(cudaMemcpy(dst, src, bytes, cudaMemcpyDeviceToDevice));
#ifdef MFEM_TRACK_CUDA_MEM
   mfem::out << "done." << std::endl;
#endif
#endif
   return dst;
}
116 
// Asynchronous device-to-device copy of 'bytes' bytes from 'src' to 'dst';
// returns 'dst' without synchronizing. No stream argument is exposed, so the
// copy is issued on the default CUDA stream.
void* CuMemcpyDtoDAsync(void* dst, const void *src, size_t bytes)
{
#ifdef MFEM_USE_CUDA
   MFEM_GPU_CHECK(cudaMemcpyAsync(dst, src, bytes, cudaMemcpyDeviceToDevice));
#endif
   return dst;
}
124 
// Copy 'bytes' bytes from device memory 'src' to host memory 'dst' with a
// blocking cudaMemcpy(..., cudaMemcpyDeviceToHost); returns 'dst'.
// A no-op (still returning 'dst') when MFEM is built without CUDA support.
// Aborts via MFEM_GPU_CHECK on error.
void* CuMemcpyDtoH(void *dst, const void *src, size_t bytes)
{
#ifdef MFEM_USE_CUDA
#ifdef MFEM_TRACK_CUDA_MEM
   // Optional transfer tracing, enabled by MFEM_TRACK_CUDA_MEM above.
   mfem::out << "CuMemcpyDtoH(): copying " << bytes << " bytes from "
             << src << " to " << dst << " ... " << std::flush;
#endif
   MFEM_GPU_CHECK(cudaMemcpy(dst, src, bytes, cudaMemcpyDeviceToHost));
#ifdef MFEM_TRACK_CUDA_MEM
   mfem::out << "done." << std::endl;
#endif
#endif
   return dst;
}
139 
// Asynchronous device-to-host copy of 'bytes' bytes from 'src' to 'dst';
// returns 'dst' without synchronizing. No stream argument is exposed, so the
// copy is issued on the default CUDA stream.
// NOTE(review): cudaMemcpyAsync may still behave synchronously when 'dst' is
// pageable (non-pinned) host memory — confirm callers pin the host buffer
// when overlap is required.
void* CuMemcpyDtoHAsync(void *dst, const void *src, size_t bytes)
{
#ifdef MFEM_USE_CUDA
   MFEM_GPU_CHECK(cudaMemcpyAsync(dst, src, bytes, cudaMemcpyDeviceToHost));
#endif
   return dst;
}
147 
// Check the error code returned by cudaGetLastError(), aborting on error.
// A no-op when MFEM is built without CUDA support.
// Fix: the function's signature line was lost in this extraction (the body
// started at a bare '{'); restored as 'void CuCheckLastError()' per the
// file's own documentation index.
void CuCheckLastError()
{
#ifdef MFEM_USE_CUDA
   MFEM_GPU_CHECK(cudaGetLastError());
#endif
}
154 
// Get the number of CUDA devices, as reported by cudaGetDeviceCount().
// Returns -1 when MFEM is built without CUDA support; aborts via
// MFEM_GPU_CHECK on a CUDA runtime error.
// Fix: the function's signature line was lost in this extraction (the body
// started at a bare '{'); restored as 'int CuGetDeviceCount()' per the
// file's own documentation index.
int CuGetDeviceCount()
{
   int num_gpus = -1; // sentinel for "CUDA not available"
#ifdef MFEM_USE_CUDA
   MFEM_GPU_CHECK(cudaGetDeviceCount(&num_gpus));
#endif
   return num_gpus;
}
163 
164 } // namespace mfem
void * CuMemcpyHtoD(void *dst, const void *src, size_t bytes)
Copies memory from Host to Device.
Definition: cuda.cpp:79
void * CuMemFree(void *dptr)
Frees device memory.
Definition: cuda.cpp:64
void CuCheckLastError()
Check the error code returned by cudaGetLastError(), aborting on error.
Definition: cuda.cpp:148
int CuGetDeviceCount()
Get the number of CUDA devices.
Definition: cuda.cpp:155
void * CuMallocManaged(void **dptr, size_t bytes)
Allocates managed device memory.
Definition: cuda.cpp:49
void mfem_cuda_error(cudaError_t err, const char *expr, const char *func, const char *file, int line)
Definition: cuda.cpp:23
void mfem_error(const char *msg)
Function called when an error is encountered. Used by the macros MFEM_ABORT, MFEM_ASSERT, MFEM_VERIFY.
Definition: error.cpp:153
void * CuMemcpyDtoD(void *dst, const void *src, size_t bytes)
Copies memory from Device to Device.
Definition: cuda.cpp:102
void * CuMemcpyDtoDAsync(void *dst, const void *src, size_t bytes)
Copies memory from Device to Device.
Definition: cuda.cpp:117
OutStream err(std::cerr)
Global stream used by the library for standard error output. Initially it uses the same std::streambuf as std::cerr.
Definition: globals.hpp:71
void * CuMemcpyDtoHAsync(void *dst, const void *src, size_t bytes)
Copies memory from Device to Host.
Definition: cuda.cpp:140
void * CuMemcpyHtoDAsync(void *dst, const void *src, size_t bytes)
Copies memory from Host to Device.
Definition: cuda.cpp:94
OutStream out(std::cout)
Global stream used by the library for standard output. Initially it uses the same std::streambuf as std::cout.
Definition: globals.hpp:66
void * CuMemAlloc(void **dptr, size_t bytes)
Allocates device memory.
Definition: cuda.cpp:34
void * CuMemcpyDtoH(void *dst, const void *src, size_t bytes)
Copies memory from Device to Host.
Definition: cuda.cpp:125