docs/cuda__manager_8h_source.html

/*

 * Copyright (c) 2013-2015:  G-CSC, Goethe University Frankfurt

 * Author: Martin Rupp

 *

 * This file is part of UG4.

 *

 * UG4 is free software: you can redistribute it and/or modify it under the

 * terms of the GNU Lesser General Public License version 3 (as published by the

 * Free Software Foundation) with the following additional attribution

 * requirements (according to LGPL/GPL v3 §7):

 *

 * (1) The following notice must be displayed in the Appropriate Legal Notices

 * of covered and combined works: "Based on UG4 (www.ug4.org/license)".

 *

 * (2) The following notice must be displayed at a prominent place in the

 * terminal output of covered works: "Based on UG4 (www.ug4.org/license)".

 *

 * (3) The following bibliography is recommended for citation and must be

 * preserved in all covered files:

 * "Reiter, S., Vogel, A., Heppner, I., Rupp, M., and Wittum, G. A massively

 *   parallel geometric multigrid solver on hierarchically distributed grids.

 *   Computing and visualization in science 16, 4 (2013), 151-164"

 * "Vogel, A., Reiter, S., Rupp, M., Nägel, A., and Wittum, G. UG4 -- a novel

 *   flexible software system for simulating pde based models on high performance

 *   computers. Computing and visualization in science 16, 4 (2013), 165-179"

 *

 * This program is distributed in the hope that it will be useful,

 * but WITHOUT ANY WARRANTY; without even the implied warranty of

 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

 * GNU Lesser General Public License for more details.

 */


#ifndef CUDAManager_H

#define CUDAManager_H


#define USE_CUSPARSE


/* Using updated (v2) interfaces to cublas and cusparse */

#include <cuda_runtime.h>


#ifdef USE_CUSPARSE

#include <cusparse_v2.h>

#endif


#include <cublas_v2.h>

#include <vector>


// Utilities and system includes

#include "common/error.h"

#include "common/log.h"


#include <string>


namespace ug{

// Debug ID of the CUDA code; the helpers in this header pass it to UG_DLOG
// for their level-2 debug messages. Only declared here.
extern DebugID DID_CUDA;


// Returns a C string for the integer error code `err`. The helpers in this
// header stream the result into their error messages. Only declared here;
// the definition lives in another translation unit.
const char *CUDAError(int err);


template<typename T>


inline void CudaCheckStatus(T status, const char * file, int line)

{

  unsigned int s = static_cast<unsigned int>(status );

  UG_COND_THROW(status != 0, "CUDA error at " << file << ":" << line << " " << s << " = " << ug::CUDAError(status) );

}

inline void CudaCheckStatus(T status, const char * file, int line) {…}


// Checks `status` with CudaCheckStatus, supplying the file and line of the
// place where the macro is used.
#define CUDA_CHECK_STATUS(status ) CudaCheckStatus(status, __FILE__, __LINE__)


/**
 * Raises an error through UG_THROW when \c err differs from cudaSuccess.
 *
 * \c err is evaluated exactly once and its value is cached. Call sites pass
 * CUDA calls directly (e.g. CUDA_CHECK_SUCCESS(cudaMemcpy(...), "...")), so
 * expanding \c err several times would re-run the call while the message is
 * assembled and could report a different code than the one that failed.
 *
 * \c desc is a stream expression appended to the message; it is only
 * evaluated in the failure case.
 *
 * The expansion is a plain compound statement, so it can be used with or
 * without a trailing semicolon.
 */
#define CUDA_CHECK_SUCCESS(err, desc) \
{\
    const int ug_cudaCheckErr_ = static_cast<int>(err);\
    if(ug_cudaCheckErr_ != cudaSuccess)\
    {\
        UG_THROW("Error in " << __FUNCTION__ << ": CUDA ERROR " << ug_cudaCheckErr_ <<":\n" <<\
            ug::CUDAError(ug_cudaCheckErr_) << "\n----------------------------\n" << desc << "\n");\
    }\
}

#define CUDA_CHECK_SUCCESS(err, desc) \ …


template<typename T>


T *MyCudaAlloc(size_t N)

{

  UG_DLOG(DID_CUDA, 2, "CUDA: Allocating " <<  sizeof(T)*N  << " bytes.\n");


  T *p;

  cudaError_t err = cudaMalloc ((void**) &p, sizeof(T)*N);

  if(err != cudaSuccess)

  {

    UG_THROW("Error in " << __FUNCTION__ << "when allocating " << sizeof(T)*N << " bytes. CUDA ERROR " << err <<": " <<

        ug::CUDAError(err));

  }

  return p;

}

T *MyCudaAlloc(size_t N) {…}


class CUDAManager

{

public:

    virtual ~CUDAManager();

    void init();

    static CUDAManager &get_instance();


#ifdef USE_CUSPARSE

public:

    static inline cusparseHandle_t get_cusparseHandle() { return get_instance().cusparseHandle; }

private:

    cusparseHandle_t cusparseHandle;

#endif


public:

    static inline cublasHandle_t get_cublasHandle() { return get_instance().cublasHandle; }

    size_t m_maxThreadsPerBlock;


    template<typename T>


    T *get_temp_buffer(size_t n)

    {

      size_t N = n*sizeof(T);

      if(N < m_tempSize) return (T*)m_tempBuffer;


      UG_DLOG(DID_CUDA, 2, "CUDA: Allocating Temp Buffer " <<  N  << " bytes.\n");

      if(m_tempBuffer)

        cudaFree(m_tempBuffer);


      m_tempBuffer = MyCudaAlloc<char>(n);


      return (T*)m_tempBuffer;

    }

    T *get_temp_buffer(size_t n) {…}


    template<typename T>


    T *get_temp_return_buffer()

  {

      return (T*)m_tempRetBuffer;

  }

    T *get_temp_return_buffer() {…}


    static void get_cuda_devices(std::vector<cudaDeviceProp> &devices);

    static int get_max_multiprocessor_cuda_device();


private:

    cublasHandle_t cublasHandle;

    void *m_tempBuffer;

    void *m_tempRetBuffer;

    size_t m_tempSize;

};

class CUDAManager {…};


/**
 * Copies all elements of \c vec to \c dest with a host-to-device cudaMemcpy.
 *
 * \param dest  destination pointer; vec.size() elements are written to it
 * \param vec   container providing value_type, size() and operator[];
 *              the copy starts at &vec[0]
 * \throws      through CUDA_CHECK_SUCCESS if cudaMemcpy does not succeed
 */
template<typename T>
inline void CudaCpyToDevice(typename T::value_type *dest, T &vec)
{
  typedef typename T::value_type value_type;

  UG_DLOG(DID_CUDA, 2, "Copying " << vec.size() << " to device\n");

  CUDA_CHECK_SUCCESS(
      cudaMemcpy(dest, &vec[0], vec.size()*sizeof(value_type), cudaMemcpyHostToDevice),
      "cudaMemcpy vec size " << vec.size());
}

inline void CudaCpyToDevice(typename T::value_type *dest, T &vec) {…}


/**
 * Fills \c dest from \c src with a device-to-host cudaMemcpy.
 *
 * The number of elements copied is dest.size(); the container is not resized.
 *
 * \param dest  container providing value_type, size() and operator[];
 *              the copy is written starting at &dest[0]
 * \param src   source pointer; dest.size() elements are read from it
 * \throws      through CUDA_CHECK_SUCCESS if cudaMemcpy does not succeed
 */
template<typename T>
inline void CudaCpyToHost(T &dest, typename T::value_type *src)
{
  typedef typename T::value_type value_type;

  UG_DLOG(DID_CUDA, 2, "Copying " << dest.size() << " to host\n");

  CUDA_CHECK_SUCCESS(
      cudaMemcpy(&dest[0], src, dest.size()*sizeof(value_type), cudaMemcpyDeviceToHost),
      "cudaMemcpy dest size " << dest.size());
}

inline void CudaCpyToHost(T &dest, typename T::value_type *src) {…}


template<typename T>


inline typename T::value_type *CudaCreateAndCopyToDevice(T &vec)

{

  UG_DLOG(DID_CUDA, 2, "Create and Copying " << vec.size() << " to host\n");

  typename T::value_type *dest;

  int N = vec.size()*sizeof(typename T::value_type);

  CUDA_CHECK_SUCCESS( cudaMalloc((void **)&dest, N),

      "Error at cudaMalloc of " << N << " bytes");


  CudaCpyToDevice(dest, vec);

  return dest;

}

inline typename T::value_type *CudaCreateAndCopyToDevice(T &vec) {…}


template<typename T>


T CUDA_GetElementFromDevice(T *p, size_t i=0)

{

  T t;

  cudaMemcpy(&t, p+i, sizeof(T), cudaMemcpyDeviceToHost);

  return t;

}

T CUDA_GetElementFromDevice(T *p, size_t i=0) {…}

}

#endif  /* CUDAManager_H */

p
parameterString p

s
parameterString s

ug::CUDAManager
Definition cuda_manager.h:94

ug::CUDAManager::get_cublasHandle
static cublasHandle_t get_cublasHandle()
Definition cuda_manager.h:108

ug::CUDAManager::cublasHandle
cublasHandle_t cublasHandle
Definition cuda_manager.h:136

ug::CUDAManager::init
void init()
Definition cuda_manager.cpp:83

ug::CUDAManager::get_max_multiprocessor_cuda_device
static int get_max_multiprocessor_cuda_device()
Definition cuda_manager.cpp:54

ug::CUDAManager::get_cusparseHandle
static cusparseHandle_t get_cusparseHandle()
Definition cuda_manager.h:102

ug::CUDAManager::cusparseHandle
cusparseHandle_t cusparseHandle
Definition cuda_manager.h:104

ug::CUDAManager::m_maxThreadsPerBlock
size_t m_maxThreadsPerBlock
Definition cuda_manager.h:109

ug::CUDAManager::get_temp_buffer
T * get_temp_buffer(size_t n)
Definition cuda_manager.h:112

ug::CUDAManager::m_tempRetBuffer
void * m_tempRetBuffer
Definition cuda_manager.h:138

ug::CUDAManager::get_temp_return_buffer
T * get_temp_return_buffer()
Definition cuda_manager.h:127

ug::CUDAManager::m_tempBuffer
void * m_tempBuffer
Definition cuda_manager.h:137

ug::CUDAManager::get_instance
static CUDAManager & get_instance()
Definition cuda_manager.cpp:153

ug::CUDAManager::m_tempSize
size_t m_tempSize
Definition cuda_manager.h:139

ug::CUDAManager::~CUDAManager
virtual ~CUDAManager()
Definition cuda_manager.cpp:68

ug::CUDAManager::get_cuda_devices
static void get_cuda_devices(std::vector< cudaDeviceProp > &devices)
Definition cuda_manager.cpp:45

ug::DebugID
Definition debug_id.h:94

error.h

CUDA_CHECK_SUCCESS
#define CUDA_CHECK_SUCCESS(err, desc)
Definition cuda_manager.h:69

UG_THROW
#define UG_THROW(msg)
Definition error.h:57

UG_DLOG
#define UG_DLOG(__debugID__, level, msg)
Definition log.h:298

UG_COND_THROW
#define UG_COND_THROW(cond, msg)
UG_COND_THROW(cond, msg) : performs a UG_THROW(msg) if cond == true.
Definition error.h:61

log.h

ug
the ug namespace

ug::MyCudaAlloc
T * MyCudaAlloc(size_t N)
Definition cuda_manager.h:78

ug::CudaCreateAndCopyToDevice
T::value_type * CudaCreateAndCopyToDevice(T &vec)
Definition cuda_manager.h:163

ug::DID_CUDA
DebugID DID_CUDA("CUDA")
Definition cuda_manager.h:55

ug::CudaCpyToHost
void CudaCpyToHost(T &dest, typename T::value_type *src)
Definition cuda_manager.h:153

ug::CudaCpyToDevice
void CudaCpyToDevice(typename T::value_type *dest, T &vec)
Definition cuda_manager.h:144

ug::CUDA_GetElementFromDevice
T CUDA_GetElementFromDevice(T *p, size_t i=0)
Definition cuda_manager.h:176

ug::CUDAError
const char * CUDAError(int err)
Definition cuda_error.cpp:35

ug::CudaCheckStatus
void CudaCheckStatus(T status, const char *file, int line)
Definition cuda_manager.h:60