Discontinuous Galerkin Library
#include "dg/algorithm.h"
Loading...
Searching...
No Matches
blas1.h
Go to the documentation of this file.
1#pragma once
2
3#include "backend/predicate.h"
8#include "backend/blas1_dispatch_scalar.h"
9#include "backend/blas1_dispatch_shared.h"
10#ifdef MPI_VERSION
11#include "backend/mpi_vector.h"
12#include "backend/blas1_dispatch_mpi.h"
13#endif
14#include "backend/blas1_dispatch_vector.h"
15#include "backend/blas1_dispatch_map.h"
16#include "subroutines.h"
17
23namespace dg{
24
33namespace blas1
34{
36template< class ContainerType, class BinarySubroutine, class Functor, class ContainerType0, class ...ContainerTypes>
37inline void evaluate( ContainerType& y, BinarySubroutine f, Functor g, const ContainerType0& x0, const ContainerTypes& ...xs);
39
42
89template<class Functor, class ContainerType, class ...ContainerTypes>
90auto vdot( Functor f, const ContainerType& x, const ContainerTypes& ...xs) ->
91 std::invoke_result_t<Functor, dg::get_value_type<ContainerType>, dg::get_value_type<ContainerTypes>...>
92{
93 // The reason it is called vdot and not dot is because of the amgiuity when vdot is called
94 // with two arguments
95 using T = std::invoke_result_t<Functor, dg::get_value_type<ContainerType>, dg::get_value_type<ContainerTypes>...>;
96
97 int status = 0;
98 if constexpr( std::is_integral_v<T>) // e.g. T = int
99 {
100 std::array<T, 1> fpe;
101 dg::blas1::detail::doDot_fpe( &status, fpe, f, x, xs ...);
102 if( fpe[0] - fpe[0] != T(0))
104 <<"dg::blas1::vdot (integral type) failed "
105 <<"since one of the inputs contains NaN or Inf");
106 return fpe[0];
107 }
108 else
109 {
110 constexpr size_t N = 3;
111 std::array<T, N> fpe;
112 dg::blas1::detail::doDot_fpe( &status, fpe, f, x, xs ...);
113 for( unsigned u=0; u<N; u++)
114 {
115 if( fpe[u] - fpe[u] != T(0))
117 <<"dg::blas1::vdot (floating type) failed "
118 <<"since one of the inputs contains NaN or Inf");
119 }
120 return exblas::cpu::Round(fpe);
121 }
122}
123
152template< class ContainerType1, class ContainerType2>
153inline auto dot( const ContainerType1& x, const ContainerType2& y)
154{
155 if constexpr (std::is_floating_point_v<get_value_type<ContainerType1>> &&
156 std::is_floating_point_v<get_value_type<ContainerType2>>)
157 {
158 int status = 0;
159 std::vector<int64_t> acc = dg::blas1::detail::doDot_superacc( &status,
160 x,y);
161 if( status != 0)
162 throw dg::Error(dg::Message(_ping_)<<"dg::blas1::dot failed "
163 <<"since one of the inputs contains NaN or Inf");
164 return exblas::cpu::Round(acc.data());
165 }
166 else
167 {
168 return dg::blas1::vdot( dg::Product(), x, y);
169 }
170}
171
172
213template< class ContainerType, class OutputType, class BinaryOp, class UnaryOp
214 = IDENTITY>
215inline OutputType reduce( const ContainerType& x, OutputType zero, BinaryOp
216 binary_op, UnaryOp unary_op = UnaryOp())
217{
218 //init must indeed have the same type as the values of Container since op must be associative
219 // The generalization would be a transform_reduce combining subroutine and reduce
220 return dg::blas1::detail::doReduce(
222 unary_op);
223}
224
242template<class ContainerTypeIn, class ContainerTypeOut>
243inline void copy( const ContainerTypeIn& source, ContainerTypeOut& target){
244 if( std::is_same_v<ContainerTypeIn, ContainerTypeOut> && &source==(const ContainerTypeIn*)&target)
245 return;
246 dg::blas1::subroutine( dg::equals(), source, target);
247}
248
262template< class ContainerType, class value_type>
263inline void scal( ContainerType& x, value_type alpha)
264{
265 if( alpha == value_type(1))
266 return;
267 dg::blas1::subroutine( dg::Scal<value_type>(alpha), x );
268}
269
283template< class ContainerType, class value_type>
284inline void plus( ContainerType& x, value_type alpha)
285{
286 if( alpha == value_type(0))
287 return;
288 dg::blas1::subroutine( dg::Plus(alpha), x );
289}
290
305template< class ContainerType, class ContainerType1, class value_type, class value_type1>
306inline void axpby( value_type alpha, const ContainerType1& x, value_type1 beta, ContainerType& y)
307{
308 if( alpha == value_type(0) ) {
309 scal( y, beta);
310 return;
311 }
312 if( std::is_same_v<ContainerType, ContainerType1> && &x==(const ContainerType1*)&y){
313 dg::blas1::scal( y, (alpha+beta));
314 return;
315 }
316 dg::blas1::subroutine( dg::Axpby(alpha, beta), x, y);
317}
318
336template< class ContainerType, class ContainerType1, class ContainerType2, class value_type, class value_type1, class value_type2>
337inline void axpbypgz( value_type alpha, const ContainerType1& x, value_type1 beta, const ContainerType2& y, value_type2 gamma, ContainerType& z)
338{
339 if( alpha == value_type(0) )
340 {
341 axpby( beta, y, gamma, z);
342 return;
343 }
344 else if( beta == value_type1(0) )
345 {
346 axpby( alpha, x, gamma, z);
347 return;
348 }
349 if( std::is_same_v<ContainerType1, ContainerType2> && &x==(const ContainerType1*)&y){
350 dg::blas1::axpby( alpha+beta, x, gamma, z);
351 return;
352 }
353 else if( std::is_same_v<ContainerType1, ContainerType> && &x==(const ContainerType1*)&z){
354 dg::blas1::axpby( beta, y, alpha+gamma, z);
355 return;
356 }
357 else if( std::is_same_v<ContainerType2, ContainerType> && &y==(const ContainerType2*)&z){
358 dg::blas1::axpby( alpha, x, beta+gamma, z);
359 return;
360 }
361 dg::blas1::subroutine( dg::Axpbypgz(alpha, beta, gamma), x, y, z);
362}
363
381template< class ContainerType, class ContainerType1, class ContainerType2, class value_type, class value_type1>
382inline void axpby( value_type alpha, const ContainerType1& x, value_type1 beta, const ContainerType2& y, ContainerType& z)
383{
384 dg::blas1::evaluate( z , dg::equals(), dg::PairSum(), alpha, x, beta, y);
385}
386
405template< class ContainerType, class ContainerType1, class ContainerType2, class value_type, class value_type1>
406inline void pointwiseDot( value_type alpha, const ContainerType1& x1, const ContainerType2& x2, value_type1 beta, ContainerType& y)
407{
408 if( alpha == value_type(0) ) {
409 dg::blas1::scal(y, beta);
410 return;
411 }
412 //not sure this is necessary performance-wise, subroutine does allow aliases
413 if( std::is_same_v<ContainerType, ContainerType1> && &x1==(const ContainerType1*)&y){
414 dg::blas1::subroutine( dg::AxyPby(alpha,beta), x2, y );
415
416 return;
417 }
418 if( std::is_same_v<ContainerType, ContainerType2> && &x2==(const ContainerType2*)&y){
419 dg::blas1::subroutine( dg::AxyPby(alpha,beta), x1, y );
420
421 return;
422 }
423 dg::blas1::subroutine( dg::PointwiseDot(alpha,beta), x1, x2, y );
424}
425
440template< class ContainerType, class ContainerType1, class ContainerType2>
441inline void pointwiseDot( const ContainerType1& x1, const ContainerType2& x2, ContainerType& y)
442{
444}
445
465template< class ContainerType, class ContainerType1, class ContainerType2, class ContainerType3, class value_type, class value_type1>
466inline void pointwiseDot( value_type alpha, const ContainerType1& x1, const ContainerType2& x2, const ContainerType3& x3, value_type1 beta, ContainerType& y)
467{
468 if( alpha == value_type(0) ) {
469 dg::blas1::scal(y, beta);
470 return;
471 }
472 dg::blas1::subroutine( dg::PointwiseDot(alpha,beta), x1, x2, x3, y );
473}
474
494template< class ContainerType, class ContainerType1, class ContainerType2, class value_type, class value_type1>
495inline void pointwiseDivide( value_type alpha, const ContainerType1& x1, const ContainerType2& x2, value_type1 beta, ContainerType& y)
496{
497 if( alpha == value_type(0) ) {
498 dg::blas1::scal(y, beta);
499 return;
500 }
501 if( std::is_same_v<ContainerType, ContainerType1> && &x1==(const ContainerType1*)&y){
502 dg::blas1::subroutine( dg::PointwiseDivide(alpha,beta), x2, y );
503
504 return;
505 }
506 dg::blas1::subroutine( dg::PointwiseDivide(alpha, beta), x1, x2, y );
507}
508
524template< class ContainerType, class ContainerType1, class ContainerType2>
525inline void pointwiseDivide( const ContainerType1& x1, const ContainerType2& x2, ContainerType& y)
526{
527 dg::blas1::evaluate( y, dg::equals(), dg::divides(), x1, x2);
528}
529
552template<class ContainerType, class ContainerType1, class ContainerType2, class ContainerType3, class ContainerType4, class value_type, class value_type1, class value_type2>
553void pointwiseDot( value_type alpha, const ContainerType1& x1, const ContainerType2& y1,
554 value_type1 beta, const ContainerType3& x2, const ContainerType4& y2,
555 value_type2 gamma, ContainerType & z)
556{
557 if( alpha==value_type(0)){
558 pointwiseDot( beta, x2,y2, gamma, z);
559 return;
560 }
561 else if( beta==value_type1(0)){
562 pointwiseDot( alpha, x1,y1, gamma, z);
563 return;
564 }
565 dg::blas1::subroutine( dg::PointwiseDot2(alpha, beta, gamma), x1, y1, x2, y2, z );
566}
567
584template< class ContainerType, class ContainerType1, class UnaryOp>
585inline void transform( const ContainerType1& x, ContainerType& y, UnaryOp op )
586{
587 dg::blas1::subroutine( dg::Evaluate<dg::equals, UnaryOp>(dg::equals(),op), y, x);
588}
589
611template< class ContainerType, class BinarySubroutine, class Functor, class ContainerType0, class ...ContainerTypes>
612inline void evaluate( ContainerType& y, BinarySubroutine f, Functor g, const ContainerType0& x0, const ContainerTypes& ...xs)
613{
614 dg::blas1::subroutine( dg::Evaluate<BinarySubroutine, Functor>(f,g), y, x0, xs...);
615}
616
617
619namespace detail{
620
621template< class T, size_t N, class Functor, class ContainerType, class ...ContainerTypes>
622inline void doDot_fpe( int* status, std::array<T,N>& fpe, Functor f,
623 const ContainerType& x, const ContainerTypes& ...xs)
624{
625 static_assert( ( dg::is_vector_v<ContainerType> && ...
627 "All container types must have a vector data layout (AnyVector)!");
628 using vector_type = find_if_t<dg::is_not_scalar, ContainerType, ContainerType, ContainerTypes...>;
629 using tensor_category = get_tensor_category<vector_type>;
630 static_assert( ( dg::is_scalar_or_same_base_category<ContainerType, tensor_category>::value &&
631 ... && dg::is_scalar_or_same_base_category<ContainerTypes, tensor_category>::value),
632 "All container types must be either Scalar or have compatible Vector categories (AnyVector or Same base class)!");
633 return doDot_fpe( tensor_category(), status, fpe, f, x, xs ...);
634
635}
636
637template< class ContainerType1, class ContainerType2>
638inline std::vector<int64_t> doDot_superacc( int * status, const ContainerType1& x, const ContainerType2& y)
639{
641 "All container types must have a vector data layout (AnyVector)!");
642 using vector_type = find_if_t<dg::is_not_scalar, ContainerType1, ContainerType1, ContainerType2>;
643 using tensor_category = get_tensor_category<vector_type>;
644 static_assert( ( dg::is_scalar_or_same_base_category<ContainerType1, tensor_category>::value
645 && dg::is_scalar_or_same_base_category<ContainerType2, tensor_category>::value),
646 "All container types must be either Scalar or have compatible Vector categories (AnyVector or Same base class)!");
647 return doDot_superacc( status, x, y, tensor_category());
648}
649
650}//namespace detail
652
676template< class Subroutine, class ContainerType, class ...ContainerTypes>
677inline void subroutine( Subroutine f, ContainerType&& x, ContainerTypes&&... xs)
678{
679 static_assert( ( dg::is_vector_v<ContainerType> &&
681 "All container types must have a vector data layout (AnyVector)!");
682 using vector_type = find_if_t<dg::is_not_scalar, ContainerType, ContainerType, ContainerTypes...>;
683 using tensor_category = get_tensor_category<vector_type>;
684 static_assert( ( dg::is_scalar_or_same_base_category<ContainerType, tensor_category>::value &&
685 ... && dg::is_scalar_or_same_base_category<ContainerTypes, tensor_category>::value),
686 "All container types must be either Scalar or have compatible Vector categories (AnyVector or Same base class)!");
687 dg::blas1::detail::doSubroutine(tensor_category(), f, std::forward<ContainerType>(x), std::forward<ContainerTypes>(xs)...);
688}
689
726template< class ContainerType0, class BinarySubroutine, class Functor, class ContainerType1, class ...ContainerTypes>
727inline void kronecker( ContainerType0& y, BinarySubroutine f, Functor g, const ContainerType1& x0, const ContainerTypes& ...xs)
728{
729 static_assert( ( (dg::is_vector_v<ContainerType0> &&
732 "All container types must have a vector data layout (AnyVector)!");
733 using vector_type = find_if_t<dg::is_not_scalar, ContainerType1, ContainerType1, ContainerTypes...>;
734 using tensor_category = get_tensor_category<vector_type>;
735 static_assert( (
736 (dg::is_scalar_or_same_base_category<ContainerType0, tensor_category>::value &&
737 dg::is_scalar_or_same_base_category<ContainerType1, tensor_category>::value) &&
738 ... && dg::is_scalar_or_same_base_category<ContainerTypes, tensor_category>::value),
739 "All container types must be either Scalar or have compatible Vector categories (AnyVector or Same base class)!");
740 dg::blas1::detail::doKronecker(tensor_category(), y, f, g, x0, xs...);
741}
742
744}//namespace blas1
745
766template<class from_ContainerType, class ContainerType, class ...Params>
767inline void assign( const from_ContainerType& from, ContainerType& to, Params&& ... ps)
768{
769 dg::detail::doAssign<from_ContainerType, ContainerType, Params...>( from, to, get_tensor_category<from_ContainerType>(), get_tensor_category<ContainerType>(), std::forward<Params>(ps)...);
770}
771
791template<class ContainerType, class from_ContainerType, class ...Params>
792inline ContainerType construct( const from_ContainerType& from, Params&& ... ps)
793{
794 return dg::detail::doConstruct<ContainerType, from_ContainerType, Params...>( from, get_tensor_category<ContainerType>(), get_tensor_category<from_ContainerType>(), std::forward<Params>(ps)...);
795}
796
856template<class ContainerType, class Functor, class ...ContainerTypes>
857auto kronecker( Functor&& f, const ContainerType& x0, const ContainerTypes& ... xs)
858{
859 using tensor_category = get_tensor_category<ContainerType>;
860 return dg::detail::doKronecker( tensor_category(), std::forward<Functor>(f), x0, xs...);
861}
862
863
864} //namespace dg
865
class intended for the use in throw statements
Definition exceptions.h:83
small class holding a stringstream
Definition exceptions.h:29
#define _ping_
Definition exceptions.h:12
DG_DEVICE T zero(T x, Ts ...xs)
This enum can be used in dg::evaluate.
Definition functions.h:19
auto kronecker(Functor &&f, const ContainerType &x0, const ContainerTypes &... xs)
Memory allocating version of dg::blas1::kronecker
Definition blas1.h:857
void copy(const ContainerTypeIn &source, ContainerTypeOut &target)
Definition blas1.h:243
void axpbypgz(value_type alpha, const ContainerType1 &x, value_type1 beta, const ContainerType2 &y, value_type2 gamma, ContainerType &z)
Definition blas1.h:337
void axpby(value_type alpha, const ContainerType1 &x, value_type1 beta, ContainerType &y)
Definition blas1.h:306
void pointwiseDot(value_type alpha, const ContainerType1 &x1, const ContainerType2 &x2, value_type1 beta, ContainerType &y)
Definition blas1.h:406
auto vdot(Functor f, const ContainerType &x, const ContainerTypes &...xs) -> std::invoke_result_t< Functor, dg::get_value_type< ContainerType >, dg::get_value_type< ContainerTypes >... >
Extended Precision transform reduce
Definition blas1.h:90
void transform(const ContainerType1 &x, ContainerType &y, UnaryOp op)
Definition blas1.h:585
void plus(ContainerType &x, value_type alpha)
Definition blas1.h:284
ContainerType construct(const from_ContainerType &from, Params &&... ps)
Generic way to construct an object of ContainerType given a from_ContainerType object and optional ad...
Definition blas1.h:792
OutputType reduce(const ContainerType &x, OutputType zero, BinaryOp binary_op, UnaryOp unary_op=UnaryOp())
Custom (transform) reduction
Definition blas1.h:215
void subroutine(Subroutine f, ContainerType &&x, ContainerTypes &&... xs)
; Customizable and generic blas1 function
Definition blas1.h:677
auto dot(const ContainerType1 &x, const ContainerType2 &y)
Binary reproducible Euclidean dot product between two vectors
Definition blas1.h:153
void evaluate(ContainerType &y, BinarySubroutine f, Functor g, const ContainerType0 &x0, const ContainerTypes &...xs)
Definition blas1.h:612
void assign(const from_ContainerType &from, ContainerType &to, Params &&... ps)
Generic way to assign the contents of a from_ContainerType object to a ContainerType object optionall...
Definition blas1.h:767
void scal(ContainerType &x, value_type alpha)
Definition blas1.h:263
void kronecker(ContainerType0 &y, BinarySubroutine f, Functor g, const ContainerType1 &x0, const ContainerTypes &...xs)
(Kronecker evaluation)
Definition blas1.h:727
void pointwiseDivide(value_type alpha, const ContainerType1 &x1, const ContainerType2 &x2, value_type1 beta, ContainerType &y)
Definition blas1.h:495
@ z
z direction
@ y
y direction
@ x
x direction
typename TensorTraits< std::decay_t< Vector > >::tensor_category get_tensor_category
Definition tensor_traits.h:47
constexpr bool is_vector_v
Utility typedef.
Definition predicate.h:75
typename TensorTraits< std::decay_t< Vector > >::value_type get_value_type
Definition tensor_traits.h:45
to
Switch for the Timeloop integrate function.
Definition ode.h:17
double Round(int64_t *accumulator)
This is the namespace for all functions and classes defined and used by the discontinuous Galerkin li...
Definition subroutines.h:11
Definition subroutines.h:124
Definition subroutines.h:100
Definition subroutines.h:22