6#include <thrust/complex.h>
12template<
class value_type>
13inline cudaDataType_t
getCudaDataType(){ assert(
false &&
"CUDA Type not supported!\n" );
return CUDA_R_64F; }
23template<
class value_type>
24inline cusparseIndexType_t
getCudaIndexType(){ assert(
false &&
"CUDA Type not supported!\n" );
return CUSPARSE_INDEX_32I; }
33 cusparseStatus_t
error()
const {
return m_error;}
34 cusparseStatus_t&
error() {
return m_error;}
35 char const*
what() const noexcept{
36 return cusparseGetErrorString(m_error);}
38 cusparseStatus_t m_error;
50 if( err != CUSPARSE_STATUS_SUCCESS)
69 cusparseHandle_t m_handle;
72 cusparseCreate( &m_handle);
76 cusparseDestroy(m_handle);
79 cusparseHandle_t
handle()
const {
return m_handle;}
91 template<
class I,
class V>
93 size_t num_rows,
size_t num_cols,
size_t nnz,
94 const I* pos ,
const I* idx,
const V* val)
96 update( num_rows, num_cols, nnz, pos, idx, val);
121 if ( m_dBuffer !=
nullptr)
122 cudaFree( m_dBuffer);
124 cusparseDestroySpMat( m_matA);
128 std::swap( m_active, src.m_active);
129 std::swap( m_matA, src.m_matA);
130 std::swap( m_dBuffer, src.m_dBuffer);
131 std::swap( m_bufferSize, src.m_bufferSize);
135 template<
class I,
class V>
137 size_t num_rows,
size_t num_cols,
size_t nnz,
138 const I* pos ,
const I* idx,
const V* val)
142 cusparseDnVecDescr_t vecX;
143 cusparseDnVecDescr_t vecY;
144 err = cusparseCreateCsr( &m_matA, num_rows, num_cols, nnz,
145 const_cast<I*
>(pos),
const_cast<I*
>(idx),
const_cast<V*
>(val),
149 cudaMalloc( &x_ptr, num_cols*
sizeof(V));
152 cudaMalloc( &y_ptr, num_cols*
sizeof(V));
154 size_t bufferSize = 0;
155 V alpha = 1, beta = 0;
158 CUSPARSE_OPERATION_NON_TRANSPOSE, &alpha, m_matA, vecX, &beta, vecY,
161 if ( m_dBuffer !=
nullptr)
162 cudaFree( m_dBuffer);
163 cudaMalloc( &m_dBuffer, bufferSize);
166#if (CUDART_VERSION >= 12040)
168 CUSPARSE_OPERATION_NON_TRANSPOSE, &alpha, m_matA, vecX, &beta, vecY,
172 err = cusparseDestroyDnVec( vecX);
173 err = cusparseDestroyDnVec( vecY);
179 cusparseSpMatDescr_t
getSpMat()
const {
return m_matA;}
182 bool m_active =
false;
183 cusparseSpMatDescr_t m_matA;
184 void * m_dBuffer =
nullptr;
185 size_t m_bufferSize = 0;
189template<
class I,
class V,
class value_type,
class C1,
class C2>
192 size_t A_num_rows,
size_t A_num_cols,
size_t A_nnz,
193 const I* A_pos ,
const I* A_idx,
const V* A_val,
194 value_type alpha, value_type beta,
const C1* x_ptr, C2* y_ptr
199 cusparseDnVecDescr_t vecX;
200 cusparseDnVecDescr_t vecY;
201 err = cusparseCreateDnVec( &vecX, A_num_cols,
const_cast<C1*
>(x_ptr),
getCudaDataType<C1>());
205 cache.
update<I,V>( A_num_rows, A_num_cols, A_nnz, A_pos, A_idx, A_val);
209 CUSPARSE_SPMV_CSR_ALG1, cache.
getBuffer());
211 err = cusparseDestroyDnVec( vecX);
212 err = cusparseDestroyDnVec( vecY);
void spmv_gpu_kernel(CSRCache_gpu &cache, size_t A_num_rows, size_t A_num_cols, size_t A_nnz, const I *A_pos, const I *A_idx, const V *A_val, value_type alpha, value_type beta, const C1 *x_ptr, C2 *y_ptr)
Definition sparsematrix_gpu.cuh:190
cudaDataType_t getCudaDataType< double >()
Definition sparsematrix_gpu.cuh:17
cusparseIndexType_t getCudaIndexType< int >()
Definition sparsematrix_gpu.cuh:25
cudaDataType_t getCudaDataType< float >()
Definition sparsematrix_gpu.cuh:16
cusparseIndexType_t getCudaIndexType< signed long int >()
Definition sparsematrix_gpu.cuh:26
cudaDataType_t getCudaDataType()
Definition sparsematrix_gpu.cuh:13
cudaDataType_t getCudaDataType< int >()
Definition sparsematrix_gpu.cuh:15
cusparseIndexType_t getCudaIndexType()
Definition sparsematrix_gpu.cuh:24
bool cusparse_is_initialized
Definition sparsematrix_gpu.cuh:85
This is the namespace for all functions and classes defined and used by the discontinuous Galerkin li...
Definition sparsematrix_gpu.cuh:89
CSRCache_gpu & operator=(CSRCache_gpu &&src)
Definition sparsematrix_gpu.cuh:114
CSRCache_gpu & operator=(const CSRCache_gpu &src)
Definition sparsematrix_gpu.cuh:106
CSRCache_gpu(CSRCache_gpu &&src)
Definition sparsematrix_gpu.cuh:102
bool isUpToDate() const
Definition sparsematrix_gpu.cuh:134
cusparseSpMatDescr_t getSpMat() const
Definition sparsematrix_gpu.cuh:179
void update(size_t num_rows, size_t num_cols, size_t nnz, const I *pos, const I *idx, const V *val)
Definition sparsematrix_gpu.cuh:136
size_t getBufferSize()
Definition sparsematrix_gpu.cuh:177
CSRCache_gpu(const CSRCache_gpu &src)
Definition sparsematrix_gpu.cuh:98
void swap(CSRCache_gpu &src)
Definition sparsematrix_gpu.cuh:126
void * getBuffer()
Definition sparsematrix_gpu.cuh:178
void forget()
Definition sparsematrix_gpu.cuh:133
CSRCache_gpu(size_t num_rows, size_t num_cols, size_t nnz, const I *pos, const I *idx, const V *val)
Definition sparsematrix_gpu.cuh:92
~CSRCache_gpu()
Definition sparsematrix_gpu.cuh:119
Definition sparsematrix_gpu.cuh:42
CusparseErrorHandle operator()(cusparseStatus_t err)
Definition sparsematrix_gpu.cuh:48
CusparseErrorHandle operator=(cusparseStatus_t err)
Definition sparsematrix_gpu.cuh:43
Definition sparsematrix_gpu.cuh:30
CusparseError(cusparseStatus_t error)
Definition sparsematrix_gpu.cuh:31
cusparseStatus_t & error()
Definition sparsematrix_gpu.cuh:34
cusparseStatus_t error() const
Definition sparsematrix_gpu.cuh:33
char const * what() const noexcept
Definition sparsematrix_gpu.cuh:35
Definition sparsematrix_gpu.cuh:60
CusparseHandle(const CusparseHandle &)=delete
void operator=(const CusparseHandle &)=delete
static CusparseHandle & getInstance()
Definition sparsematrix_gpu.cuh:61
cusparseHandle_t handle() const
Definition sparsematrix_gpu.cuh:79