8#include "backend/blas1_dispatch_scalar.h"
9#include "backend/blas1_dispatch_shared.h"
12#include "backend/blas1_dispatch_mpi.h"
14#include "backend/blas1_dispatch_vector.h"
15#include "backend/blas1_dispatch_map.h"
36template<
class ContainerType,
class BinarySubroutine,
class Functor,
class ContainerType0,
class ...ContainerTypes>
37inline void evaluate( ContainerType&
y, BinarySubroutine f, Functor g,
const ContainerType0& x0,
const ContainerTypes& ...xs);
89template<
class Functor,
class ContainerType,
class ...ContainerTypes>
90auto vdot( Functor f,
const ContainerType& x,
const ContainerTypes& ...xs) ->
98 if constexpr( std::is_integral_v<T>)
100 std::array<T, 1> fpe;
101 dg::blas1::detail::doDot_fpe( &status, fpe, f,
x, xs ...);
102 if( fpe[0] - fpe[0] != T(0))
104 <<
"dg::blas1::vdot (integral type) failed "
105 <<
"since one of the inputs contains NaN or Inf");
110 constexpr size_t N = 3;
111 std::array<T, N> fpe;
112 dg::blas1::detail::doDot_fpe( &status, fpe, f,
x, xs ...);
113 for(
unsigned u=0; u<N; u++)
115 if( fpe[u] - fpe[u] != T(0))
117 <<
"dg::blas1::vdot (floating type) failed "
118 <<
"since one of the inputs contains NaN or Inf");
152template<
class ContainerType1,
class ContainerType2>
153inline auto dot(
const ContainerType1& x,
const ContainerType2&
y)
155 if constexpr (std::is_floating_point_v<get_value_type<ContainerType1>> &&
156 std::is_floating_point_v<get_value_type<ContainerType2>>)
159 std::vector<int64_t> acc = dg::blas1::detail::doDot_superacc( &status,
163 <<
"since one of the inputs contains NaN or Inf");
213template<
class ContainerType,
class OutputType,
class BinaryOp,
class UnaryOp
215inline OutputType
reduce(
const ContainerType& x, OutputType
zero, BinaryOp
216 binary_op, UnaryOp unary_op = UnaryOp())
220 return dg::blas1::detail::doReduce(
242template<
class ContainerTypeIn,
class ContainerTypeOut>
243inline void copy(
const ContainerTypeIn& source, ContainerTypeOut& target){
244 if( std::is_same_v<ContainerTypeIn, ContainerTypeOut> && &source==(
const ContainerTypeIn*)&target)
262template<
class ContainerType,
class value_type>
263inline void scal( ContainerType& x, value_type alpha)
265 if( alpha == value_type(1))
283template<
class ContainerType,
class value_type>
284inline void plus( ContainerType& x, value_type alpha)
286 if( alpha == value_type(0))
305template<
class ContainerType,
class ContainerType1,
class value_type,
class value_type1>
306inline void axpby( value_type alpha,
const ContainerType1& x, value_type1 beta, ContainerType&
y)
308 if( alpha == value_type(0) ) {
312 if( std::is_same_v<ContainerType, ContainerType1> && &
x==(
const ContainerType1*)&
y){
336template<
class ContainerType,
class ContainerType1,
class ContainerType2,
class value_type,
class value_type1,
class value_type2>
337inline void axpbypgz( value_type alpha,
const ContainerType1& x, value_type1 beta,
const ContainerType2&
y, value_type2 gamma, ContainerType&
z)
339 if( alpha == value_type(0) )
344 else if( beta == value_type1(0) )
349 if( std::is_same_v<ContainerType1, ContainerType2> && &
x==(
const ContainerType1*)&
y){
353 else if( std::is_same_v<ContainerType1, ContainerType> && &
x==(
const ContainerType1*)&
z){
357 else if( std::is_same_v<ContainerType2, ContainerType> && &
y==(
const ContainerType2*)&
z){
381template<
class ContainerType,
class ContainerType1,
class ContainerType2,
class value_type,
class value_type1>
382inline void axpby( value_type alpha,
const ContainerType1& x, value_type1 beta,
const ContainerType2&
y, ContainerType&
z)
405template<
class ContainerType,
class ContainerType1,
class ContainerType2,
class value_type,
class value_type1>
406inline void pointwiseDot( value_type alpha,
const ContainerType1& x1,
const ContainerType2& x2, value_type1 beta, ContainerType&
y)
408 if( alpha == value_type(0) ) {
413 if( std::is_same_v<ContainerType, ContainerType1> && &x1==(
const ContainerType1*)&
y){
418 if( std::is_same_v<ContainerType, ContainerType2> && &x2==(
const ContainerType2*)&
y){
440template<
class ContainerType,
class ContainerType1,
class ContainerType2>
441inline void pointwiseDot(
const ContainerType1& x1,
const ContainerType2& x2, ContainerType&
y)
465template<
class ContainerType,
class ContainerType1,
class ContainerType2,
class ContainerType3,
class value_type,
class value_type1>
466inline void pointwiseDot( value_type alpha,
const ContainerType1& x1,
const ContainerType2& x2,
const ContainerType3& x3, value_type1 beta, ContainerType&
y)
468 if( alpha == value_type(0) ) {
494template<
class ContainerType,
class ContainerType1,
class ContainerType2,
class value_type,
class value_type1>
495inline void pointwiseDivide( value_type alpha,
const ContainerType1& x1,
const ContainerType2& x2, value_type1 beta, ContainerType&
y)
497 if( alpha == value_type(0) ) {
501 if( std::is_same_v<ContainerType, ContainerType1> && &x1==(
const ContainerType1*)&
y){
524template<
class ContainerType,
class ContainerType1,
class ContainerType2>
525inline void pointwiseDivide(
const ContainerType1& x1,
const ContainerType2& x2, ContainerType&
y)
552template<
class ContainerType,
class ContainerType1,
class ContainerType2,
class ContainerType3,
class ContainerType4,
class value_type,
class value_type1,
class value_type2>
553void pointwiseDot( value_type alpha,
const ContainerType1& x1,
const ContainerType2& y1,
554 value_type1 beta,
const ContainerType3& x2,
const ContainerType4& y2,
555 value_type2 gamma, ContainerType &
z)
557 if( alpha==value_type(0)){
561 else if( beta==value_type1(0)){
584template<
class ContainerType,
class ContainerType1,
class UnaryOp>
585inline void transform(
const ContainerType1& x, ContainerType&
y, UnaryOp op )
611template<
class ContainerType,
class BinarySubroutine,
class Functor,
class ContainerType0,
class ...ContainerTypes>
612inline void evaluate( ContainerType&
y, BinarySubroutine f, Functor g,
const ContainerType0& x0,
const ContainerTypes& ...xs)
621template<
class T,
size_t N,
class Functor,
class ContainerType,
class ...ContainerTypes>
622inline void doDot_fpe(
int* status, std::array<T,N>& fpe, Functor f,
623 const ContainerType& x,
const ContainerTypes& ...xs)
627 "All container types must have a vector data layout (AnyVector)!");
628 using vector_type = find_if_t<dg::is_not_scalar, ContainerType, ContainerType, ContainerTypes...>;
630 static_assert( ( dg::is_scalar_or_same_base_category<ContainerType, tensor_category>::value &&
631 ... && dg::is_scalar_or_same_base_category<ContainerTypes, tensor_category>::value),
632 "All container types must be either Scalar or have compatible Vector categories (AnyVector or Same base class)!");
633 return doDot_fpe( tensor_category(), status, fpe, f, x, xs ...);
637template<
class ContainerType1,
class ContainerType2>
638inline std::vector<int64_t> doDot_superacc(
int * status,
const ContainerType1& x,
const ContainerType2& y)
641 "All container types must have a vector data layout (AnyVector)!");
642 using vector_type = find_if_t<dg::is_not_scalar, ContainerType1, ContainerType1, ContainerType2>;
643 using tensor_category = get_tensor_category<vector_type>;
644 static_assert( ( dg::is_scalar_or_same_base_category<ContainerType1, tensor_category>::value
645 && dg::is_scalar_or_same_base_category<ContainerType2, tensor_category>::value),
646 "All container types must be either Scalar or have compatible Vector categories (AnyVector or Same base class)!");
647 return doDot_superacc( status, x, y, tensor_category());
676template<
class Subroutine,
class ContainerType,
class ...ContainerTypes>
677inline void subroutine( Subroutine f, ContainerType&& x, ContainerTypes&&... xs)
681 "All container types must have a vector data layout (AnyVector)!");
682 using vector_type = find_if_t<dg::is_not_scalar, ContainerType, ContainerType, ContainerTypes...>;
684 static_assert( ( dg::is_scalar_or_same_base_category<ContainerType, tensor_category>::value &&
685 ... && dg::is_scalar_or_same_base_category<ContainerTypes, tensor_category>::value),
686 "All container types must be either Scalar or have compatible Vector categories (AnyVector or Same base class)!");
687 dg::blas1::detail::doSubroutine(tensor_category(), f, std::forward<ContainerType>(
x), std::forward<ContainerTypes>(xs)...);
726template<
class ContainerType0,
class BinarySubroutine,
class Functor,
class ContainerType1,
class ...ContainerTypes>
727inline void kronecker( ContainerType0&
y, BinarySubroutine f, Functor g,
const ContainerType1& x0,
const ContainerTypes& ...xs)
732 "All container types must have a vector data layout (AnyVector)!");
733 using vector_type = find_if_t<dg::is_not_scalar, ContainerType1, ContainerType1, ContainerTypes...>;
736 (dg::is_scalar_or_same_base_category<ContainerType0, tensor_category>::value &&
737 dg::is_scalar_or_same_base_category<ContainerType1, tensor_category>::value) &&
738 ... && dg::is_scalar_or_same_base_category<ContainerTypes, tensor_category>::value),
739 "All container types must be either Scalar or have compatible Vector categories (AnyVector or Same base class)!");
740 dg::blas1::detail::doKronecker(tensor_category(),
y, f, g, x0, xs...);
766template<
class from_ContainerType,
class ContainerType,
class ...Params>
767inline void assign(
const from_ContainerType& from, ContainerType&
to, Params&& ... ps)
791template<
class ContainerType,
class from_ContainerType,
class ...Params>
792inline ContainerType
construct(
const from_ContainerType& from, Params&& ... ps)
856template<
class ContainerType,
class Functor,
class ...ContainerTypes>
857auto kronecker( Functor&& f,
const ContainerType& x0,
const ContainerTypes& ... xs)
860 return dg::detail::doKronecker( tensor_category(), std::forward<Functor>(f), x0, xs...);
class intended for the use in throw statements
Definition exceptions.h:83
small class holding a stringstream
Definition exceptions.h:29
#define _ping_
Definition exceptions.h:12
DG_DEVICE T zero(T x, Ts ...xs)
This enum can be used in dg::evaluate.
Definition functions.h:19
auto kronecker(Functor &&f, const ContainerType &x0, const ContainerTypes &... xs)
Memory allocating version of dg::blas1::kronecker
Definition blas1.h:857
void copy(const ContainerTypeIn &source, ContainerTypeOut &target)
Definition blas1.h:243
void axpbypgz(value_type alpha, const ContainerType1 &x, value_type1 beta, const ContainerType2 &y, value_type2 gamma, ContainerType &z)
Definition blas1.h:337
void axpby(value_type alpha, const ContainerType1 &x, value_type1 beta, ContainerType &y)
Definition blas1.h:306
void pointwiseDot(value_type alpha, const ContainerType1 &x1, const ContainerType2 &x2, value_type1 beta, ContainerType &y)
Definition blas1.h:406
auto vdot(Functor f, const ContainerType &x, const ContainerTypes &...xs) -> std::invoke_result_t< Functor, dg::get_value_type< ContainerType >, dg::get_value_type< ContainerTypes >... >
Extended Precision transform reduce
Definition blas1.h:90
void transform(const ContainerType1 &x, ContainerType &y, UnaryOp op)
Definition blas1.h:585
void plus(ContainerType &x, value_type alpha)
Definition blas1.h:284
ContainerType construct(const from_ContainerType &from, Params &&... ps)
Generic way to construct an object of ContainerType given a from_ContainerType object and optional ad...
Definition blas1.h:792
OutputType reduce(const ContainerType &x, OutputType zero, BinaryOp binary_op, UnaryOp unary_op=UnaryOp())
Custom (transform) reduction
Definition blas1.h:215
void subroutine(Subroutine f, ContainerType &&x, ContainerTypes &&... xs)
; Customizable and generic blas1 function
Definition blas1.h:677
auto dot(const ContainerType1 &x, const ContainerType2 &y)
Binary reproducible Euclidean dot product between two vectors
Definition blas1.h:153
void evaluate(ContainerType &y, BinarySubroutine f, Functor g, const ContainerType0 &x0, const ContainerTypes &...xs)
Definition blas1.h:612
void assign(const from_ContainerType &from, ContainerType &to, Params &&... ps)
Generic way to assign the contents of a from_ContainerType object to a ContainerType object optionall...
Definition blas1.h:767
void scal(ContainerType &x, value_type alpha)
Definition blas1.h:263
void kronecker(ContainerType0 &y, BinarySubroutine f, Functor g, const ContainerType1 &x0, const ContainerTypes &...xs)
(Kronecker evaluation)
Definition blas1.h:727
void pointwiseDivide(value_type alpha, const ContainerType1 &x1, const ContainerType2 &x2, value_type1 beta, ContainerType &y)
Definition blas1.h:495
typename TensorTraits< std::decay_t< Vector > >::tensor_category get_tensor_category
Definition tensor_traits.h:47
constexpr bool is_vector_v
Utility typedef.
Definition predicate.h:75
typename TensorTraits< std::decay_t< Vector > >::value_type get_value_type
Definition tensor_traits.h:45
to
Switch for the Timeloop integrate function.
Definition ode.h:17
double Round(int64_t *accumulator)
This is the namespace for all functions and classes defined and used by the discontinuous Galerkin li...
Definition subroutines.h:11
Definition subroutines.h:124
Definition subroutines.h:100
Definition subroutines.h:22