18struct TensorMultiply2d
20 template<
class VL,
class V0,
class V1,
class V2,
class VM,
class V3,
class V4>
22 void operator() ( VL lambda, V0 t00, V0 t01, V0 t10, V0 t11,
23 V1 in0, V2 in1, VM mu, V3& out0, V4& out1)
const
25 auto tmp0 = DG_FMA(t00,in0 , t01*in1);
26 auto tmp1 = DG_FMA(t10,in0 , t11*in1);
28 out1 = DG_FMA( lambda, tmp1, temp);
30 out0 = DG_FMA( lambda, tmp0, temp);
34struct TensorMultiply3d
36 template<
class VL,
class V0,
class V1,
class V2,
class V3,
class VM,
class V4,
class V5,
class V6>
38 void operator() ( VL lambda,
39 V0 t00, V0 t01, V0 t02,
40 V0 t10, V0 t11, V0 t12,
41 V0 t20, V0 t21, V0 t22,
42 V1 in0, V2 in1, V3 in2,
44 V4& out0, V5& out1, V6& out2)
const
46 auto tmp0 = DG_FMA( t00,in0 , (DG_FMA( t01,in1 , t02*in2)));
47 auto tmp1 = DG_FMA( t10,in0 , (DG_FMA( t11,in1 , t12*in2)));
48 auto tmp2 = DG_FMA( t20,in0 , (DG_FMA( t21,in1 , t22*in2)));
50 out2 = DG_FMA( lambda, tmp2, temp);
52 out1 = DG_FMA( lambda, tmp1, temp);
54 out0 = DG_FMA( lambda, tmp0, temp);
58struct InverseTensorMultiply2d
60 template<
class VL,
class V0,
class V1,
class V2,
class VM,
class V3,
class V4>
62 void operator() ( VL lambda, V0 t00, V0 t01, V0 t10, V0 t11,
63 V1 in0, V2 in1, VM mu, V3& out0, V4& out1)
const
65 auto dett = DG_FMA( t00,t11 , (-t10*t01));
66 auto tmp0 = DG_FMA( in0,t11 , (-in1*t01));
67 auto tmp1 = DG_FMA( t00,in1 , (-t10*in0));
69 out1 = DG_FMA( lambda, tmp1/dett, temp);
71 out0 = DG_FMA( lambda, tmp0/dett, temp);
75struct InverseTensorMultiply3d
77 template<
class VL,
class V0,
class V1,
class V2,
class V3,
class VM,
class V4,
class V5,
class V6>
79 void operator() ( VL lambda,
80 V0 t00, V0 t01, V0 t02,
81 V0 t10, V0 t11, V0 t12,
82 V0 t20, V0 t21, V0 t22,
83 V1 in0, V2 in1, V3 in2,
85 V4& out0, V5& out1, V6& out2)
const
87 auto dett = t00*DG_FMA(t11, t22, (-t12*t21))
88 -t01*DG_FMA(t10, t22, (-t20*t12))
89 +t02*DG_FMA(t10, t21, (-t20*t11));
91 auto tmp0 = in0*DG_FMA(t11, t22, (-t12*t21))
92 -t01*DG_FMA(in1, t22, (-in2*t12))
93 +t02*DG_FMA(in1, t21, (-in2*t11));
94 auto tmp1 = t00*DG_FMA(in1, t22, (-t12*in2))
95 -in0*DG_FMA(t10, t22, (-t20*t12))
96 +t02*DG_FMA(t10, in2, (-t20*in1));
97 auto tmp2 = t00*DG_FMA(t11, in2, (-in1*t21))
98 -t01*DG_FMA(t10, in2, (-t20*in1))
99 +in0*DG_FMA(t10, t21, (-t20*t11));
101 out2 = DG_FMA( lambda, tmp2/dett, temp);
103 out1 = DG_FMA( lambda, tmp1/dett, temp);
105 out0 = DG_FMA( lambda, tmp0/dett, temp);
109struct TensorDeterminant2d
111 template<
class value_type>
113 value_type operator() ( value_type t00, value_type t01,
114 value_type t10, value_type t11)
const
116 return DG_FMA( t00,t11 , (-t10*t01));
120struct TensorDeterminant3d
122 template<
class value_type>
124 value_type operator() ( value_type t00, value_type t01, value_type t02,
125 value_type t10, value_type t11, value_type t12,
126 value_type t20, value_type t21, value_type t22)
const
128 return t00* DG_FMA( t11,t22 , (-t21*t12))
129 -t01* DG_FMA( t10,t22 , (-t20*t12))
130 +t02* DG_FMA( t10,t21 , (-t20*t11));
137 template<
class VL,
class V0,
class V1,
class V2,
class VM,
class V3,
class V4>
140 VL lambda, V0 v0, V1 v1,
146 auto tmp0 = DG_FMA(t00,w0 , t01*w1);
147 auto tmp1 = DG_FMA(t10,w0 , t11*w1);
148 return lambda*mu*DG_FMA(v0,tmp0 , v1*tmp1);
154 template<
class VL,
class V0,
class V1,
class V2,
class V3,
class VM,
class V4,
class V5,
class V6>
159 V3 t00, V3 t01, V3 t02,
160 V3 t10, V3 t11, V3 t12,
161 V3 t20, V3 t21, V3 t22,
163 V4 w0, V5 w1, V6 w2)
const
165 auto tmp0 = DG_FMA( t00,w0 , (DG_FMA( t01,w1 , t02*w2)));
166 auto tmp1 = DG_FMA( t10,w0 , (DG_FMA( t11,w1 , t12*w2)));
167 auto tmp2 = DG_FMA( t20,w0 , (DG_FMA( t21,w1 , t22*w2)));
168 return lambda*mu*DG_FMA(v0,tmp0 , DG_FMA(v1,tmp1 , v2*tmp2));
191template<
class ContainerType0,
class ContainerType1>
194 unsigned size=t.
values().size();
195 for(
unsigned i=0; i<size; i++)
214template<
class ContainerTypeL,
class ContainerType0,
class ContainerType1,
class ContainerType2,
class ContainerTypeM,
class ContainerType3,
class ContainerType4>
215void multiply2d(
const ContainerTypeL& lambda,
const SparseTensor<ContainerType0>& t,
const ContainerType1& in0,
const ContainerType2& in1,
const ContainerTypeM& mu, ContainerType3& out0, ContainerType4& out1)
220 in0, in1, mu, out0, out1);
239template<
class ContainerTypeL,
class ContainerType0,
class ContainerType1,
class ContainerType2,
class ContainerType3,
class ContainerTypeM,
class ContainerType4,
class ContainerType5,
class ContainerType6>
240void multiply3d(
const ContainerTypeL& lambda,
const SparseTensor<ContainerType0>& t,
const ContainerType1& in0,
const ContainerType2& in1,
const ContainerType3& in2,
const ContainerTypeM& mu, ContainerType4& out0, ContainerType5& out1, ContainerType6& out2)
247 mu, out0, out1, out2);
265template<
class ContainerTypeL,
class ContainerType0,
class ContainerType1,
class ContainerType2,
class ContainerTypeM,
class ContainerType3,
class ContainerType4>
271 in0, in1, mu, out0, out1);
291template<
class ContainerTypeL,
class ContainerType0,
class ContainerType1,
class ContainerType2,
class ContainerType3,
class ContainerTypeM,
class ContainerType4,
class ContainerType5,
class ContainerType6>
292void inv_multiply3d(
const ContainerTypeL& lambda,
const SparseTensor<ContainerType0>& t,
const ContainerType1& in0,
const ContainerType2& in1,
const ContainerType3& in2,
const ContainerTypeM& mu, ContainerType4& out0, ContainerType5& out1, ContainerType6& out2)
299 mu, out0, out1, out2);
311template<
class ContainerType>
314 ContainerType det = t.
value(0,0);
331template<
class ContainerType>
334 ContainerType det = t.
value(0,0);
361template<
class ContainerType>
388template<
class ContainerType>
410template<
class ContainerType0,
class ContainerType1,
class ContainerType2,
class ContainerType3,
class ContainerType4>
430template<
class ContainerType0,
class ContainerType1,
class ContainerType2,
class ContainerType3,
class ContainerType4,
class ContainerType5,
class ContainerType6>
431void multiply3d(
const SparseTensor<ContainerType0>& t,
const ContainerType1& in0,
const ContainerType2& in1,
const ContainerType3& in2, ContainerType4& out0, ContainerType5& out1, ContainerType6& out2)
433 multiply3d( 1., t, in0, in1, in2, 0., out0, out1, out2);
448template<
class ContainerType0,
class ContainerType1,
class ContainerType2,
class ContainerType3,
class ContainerType4>
469template<
class ContainerType0,
class ContainerType1,
class ContainerType2,
class ContainerType3,
class ContainerType4,
class ContainerType5,
class ContainerType6>
492template<
class ContainerTypeL,
class ContainerType0,
class ContainerType1,
class ContainerType2,
class ContainerType3,
class ContainerTypeM,
class ContainerType4,
class ContainerType5,
class value_type0,
class value_type1>
495 const ContainerTypeL& lambda,
496 const ContainerType0& v0,
497 const ContainerType1& v1,
499 const ContainerTypeM& mu,
500 const ContainerType3& w0,
501 const ContainerType4& w1,
506 dg::Axpby( alpha, beta),
532template<
class ContainerTypeL,
class ContainerType0,
class ContainerType1,
class ContainerType2,
class ContainerType3,
class ContainerTypeM,
class ContainerType4,
class ContainerType5,
class ContainerType6,
class ContainerType7,
class value_type0,
class value_type1>
535 const ContainerTypeL& lambda,
536 const ContainerType0& v0,
537 const ContainerType1& v1,
538 const ContainerType2& v2,
540 const ContainerTypeM& mu,
541 const ContainerType4& w0,
542 const ContainerType5& w1,
543 const ContainerType6& w2,
548 dg::Axpby( alpha, beta),
void pointwiseDot(value_type alpha, const ContainerType1 &x1, const ContainerType2 &x2, value_type1 beta, ContainerType &y)
Definition blas1.h:406
void transform(const ContainerType1 &x, ContainerType &y, UnaryOp op)
Definition blas1.h:585
void subroutine(Subroutine f, ContainerType &&x, ContainerTypes &&... xs)
; Customizable and generic blas1 function
Definition blas1.h:677
void evaluate(ContainerType &y, BinarySubroutine f, Functor g, const ContainerType0 &x0, const ContainerTypes &...xs)
Definition blas1.h:612
typename TensorTraits< std::decay_t< Vector > >::value_type get_value_type
Definition tensor_traits.h:45
void inv_multiply3d(const ContainerTypeL &lambda, const SparseTensor< ContainerType0 > &t, const ContainerType1 &in0, const ContainerType2 &in1, const ContainerType3 &in2, const ContainerTypeM &mu, ContainerType4 &out0, ContainerType5 &out1, ContainerType6 &out2)
i
Definition multiply.h:292
void scalar_product2d(value_type0 alpha, const ContainerTypeL &lambda, const ContainerType0 &v0, const ContainerType1 &v1, const SparseTensor< ContainerType2 > &t, const ContainerTypeM &mu, const ContainerType3 &w0, const ContainerType4 &w1, value_type1 beta, ContainerType5 &y)
Definition multiply.h:493
ContainerType determinant2d(const SparseTensor< ContainerType > &t)
Definition multiply.h:312
void inv_multiply2d(const ContainerTypeL &lambda, const SparseTensor< ContainerType0 > &t, const ContainerType1 &in0, const ContainerType2 &in1, const ContainerTypeM &mu, ContainerType3 &out0, ContainerType4 &out1)
Definition multiply.h:266
void scalar_product3d(value_type0 alpha, const ContainerTypeL &lambda, const ContainerType0 &v0, const ContainerType1 &v1, const ContainerType2 &v2, const SparseTensor< ContainerType3 > &t, const ContainerTypeM &mu, const ContainerType4 &w0, const ContainerType5 &w1, const ContainerType6 &w2, value_type1 beta, ContainerType7 &y)
Definition multiply.h:533
void multiply2d(const ContainerTypeL &lambda, const SparseTensor< ContainerType0 > &t, const ContainerType1 &in0, const ContainerType2 &in1, const ContainerTypeM &mu, ContainerType3 &out0, ContainerType4 &out1)
Definition multiply.h:215
ContainerType determinant(const SparseTensor< ContainerType > &t)
Definition multiply.h:332
ContainerType volume(const SparseTensor< ContainerType > &t)
Definition multiply.h:389
void multiply3d(const ContainerTypeL &lambda, const SparseTensor< ContainerType0 > &t, const ContainerType1 &in0, const ContainerType2 &in1, const ContainerType3 &in2, const ContainerTypeM &mu, ContainerType4 &out0, ContainerType5 &out1, ContainerType6 &out2)
Definition multiply.h:240
void scal(SparseTensor< ContainerType0 > &t, const ContainerType1 &mu)
Definition multiply.h:192
ContainerType volume2d(const SparseTensor< ContainerType > &t)
Definition multiply.h:362
#define DG_DEVICE
Expands to __host__ __device__ if compiled with nvcc else is empty.
Definition dg_doc.h:378
This is the namespace for all functions and classes defined and used by the discontinuous Galerkin li...
Class for 2x2 and 3x3 matrices sharing elements.
Definition tensor.h:51
std::vector< container > & values()
Return write access to the values array.
Definition tensor.h:151
const container & value(size_t i, size_t j) const
Read access the underlying container.
Definition tensor.h:141
Definition subroutines.h:22