Discontinuous Galerkin Library
#include "dg/algorithm.h"
Loading...
Searching...
No Matches
fma.h
Go to the documentation of this file.
1#pragma once
2
3#include <cmath>
4#include <complex>
5#include <thrust/complex.h>
6
7namespace dg
8{
10namespace detail
11{
12// Making T0, T1, T2 different fixes problem that any of them may be const reference types
13// overload A in std::fma
14// for cuda all types must be equal?
15template<class T0, class T1, class T2, class = std::enable_if_t<std::is_floating_point_v<T2> >>
17auto dg_fma( T0 x, T1 y, T2 z)
18{
19 return fma( (T2)x, (T2)y, z);
20}
21template<class T0, class T, class = std::enable_if_t<std::is_floating_point_v<T> >>
22std::complex<T> dg_fma( T0 x, std::complex<T> y, std::complex<T> z)
23{
24 return {
25 std::fma( (T)x, y.real(), z.real()),
26 std::fma( (T)x, y.imag(), z.imag())
27 };
28}
29template<class T, class = std::enable_if_t<std::is_floating_point_v<T> >>
30std::complex<T> dg_fma( std::complex<T> x, std::complex<T> y, std::complex<T> z)
31{
32 std::complex<T> out = {
33 std::fma( x.real(), y.real(), z.real()),
34 std::fma( x.real(), y.imag(), z.imag())
35 };
36 return {
37 std::fma( -x.imag(), y.imag(), out.real()),
38 std::fma( x.imag(), y.real(), out.imag())
39 };
40}
41template<class T0, class T, class = std::enable_if_t<std::is_floating_point_v<T> >>
43thrust::complex<T> dg_fma( T0 x, thrust::complex<T> y, thrust::complex<T> z)
44{
45 return {
46 fma( (T)x, y.real(), z.real()),
47 fma( (T)x, y.imag(), z.imag())
48 };
49}
50template<class T, class = std::enable_if_t<std::is_floating_point_v<T> >>
52thrust::complex<T> dg_fma( thrust::complex<T> x, thrust::complex<T> y, thrust::complex<T> z)
53{
54 thrust::complex<T> out = {
55 fma( x.real(), y.real(), z.real()),
56 fma( x.real(), y.imag(), z.imag())
57 };
58 return {
59 fma( -x.imag(), y.imag(), out.real()),
60 fma( x.imag(), y.real(), out.imag())
61 };
62}
63
64
65} // namespace detail
67} // namespace dg
@ z
z direction
@ y
y direction
@ x
x direction
#define DG_DEVICE
Expands to __host__ __device__ if compiled with nvcc else is empty.
Definition dg_doc.h:378
This is the namespace for all functions and classes defined and used by the discontinuous Galerkin li...