Discontinuous Galerkin Library
#include "dg/algorithm.h"
Loading...
Searching...
No Matches
sparsematrix_omp.h
Go to the documentation of this file.
1#pragma once
2namespace dg
3{
4namespace detail
5{
6// !!! Do not edit by hand:
7// 1. copy CSRCache_cpu and spmv_cpu_kernel from sparsematrix_cpu.h
8// 2. uncomment the pragma omp parallel
9// 3. Rename cpu to omp
10
12{
13 void forget(){}
14};
15//y = alpha A*x + beta y
16template<class I, class V, class value_type, class C1, class C2>
18 CSRCache_omp& cache,
19 size_t A_num_rows, size_t A_num_cols, size_t A_nnz,
20 const I* RESTRICT A_pos , const I* RESTRICT A_idx, const V* RESTRICT A_val,
21 value_type alpha, value_type beta, const C1* RESTRICT x_ptr, C2* RESTRICT y_ptr
22)
23{
24 if( beta == value_type(1))
25 {
26 #pragma omp for nowait
27 for(int i = 0; i < (int)A_num_rows; i++)
28 {
29 for (int jj = A_pos[i]; jj < A_pos[i+1]; jj++)
30 {
31 int j = A_idx[jj];
32 y_ptr[i] = DG_FMA( alpha*A_val[jj], x_ptr[j], y_ptr[i]);
33 }
34 }
35 }
36 else
37 {
38 #pragma omp for nowait
39 for(int i = 0; i < (int)A_num_rows; i++)
40 {
41 value_type temp = 0;
42 for (int jj = A_pos[i]; jj < A_pos[i+1]; jj++)
43 {
44 int j = A_idx[jj];
45 temp = DG_FMA( alpha*A_val[jj], x_ptr[j], temp);
46 }
47
48 y_ptr[i] = DG_FMA( beta, y_ptr[i], temp);
49 }
50 }
51}
52
53}//namespace detail
54}//namespace dg
void spmv_omp_kernel(CSRCache_omp &cache, size_t A_num_rows, size_t A_num_cols, size_t A_nnz, const I *RESTRICT A_pos, const I *RESTRICT A_idx, const V *RESTRICT A_val, value_type alpha, value_type beta, const C1 *RESTRICT x_ptr, C2 *RESTRICT y_ptr)
Definition sparsematrix_omp.h:17
This is the namespace for all functions and classes defined and used by the discontinuous Galerkin li...
Definition sparsematrix_omp.h:12
void forget()
Definition sparsematrix_omp.h:13