23namespace vctr::expressions
26template <
size_t extent,
class SrcType>
27requires is::number<ValueType<SrcType>>
33 VCTR_COMMON_UNARY_EXPRESSION_MEMBERS (
Mean, src)
35 static constexpr value_type reductionResultInitValue = 0;
37 VCTR_FORCEDINLINE
constexpr void reduceElementWise (value_type& result,
size_t i)
const
43 VCTR_FORCEDINLINE value_type reduceVectorOp()
const
46 return Expression::Accelerate::mean (src.data(), size());
49 VCTR_FORCEDINLINE value_type reduceVectorOp()
const
52 return Expression::IPP::mean (src.data(),
sizeToInt (size()));
56 VCTR_FORWARD_PREPARE_SIMD_EVALUATION_UNARY_EXPRESSION_MEMBER_FUNCTIONS
61 result = Expression::Neon::add (result, src.getNeon (i));
64 VCTR_FORCEDINLINE VCTR_TARGET (
"fma")
void reduceAVXRegisterWise (
AVXRegister<value_type>& result,
size_t i)
const
67 result = Expression::AVX::add (result, src.getAVX (i));
70 VCTR_FORCEDINLINE VCTR_TARGET (
"avx2")
void reduceAVXRegisterWise (
AVXRegister<value_type>& result,
size_t i)
const
73 result = Expression::AVX::add (result, src.getAVX (i));
76 VCTR_FORCEDINLINE VCTR_TARGET (
"sse4.1")
void reduceSSERegisterWise (
SSERegister<value_type>& result,
size_t i)
const
79 result = Expression::SSE::add (result, src.getSSE (i));
84 VCTR_FORCEDINLINE
constexpr value_type finalizeReduction (
const std::array<value_type, n>& sums)
const
86 auto sum = n == 1 ? sums[0] : std::reduce (sums.begin(), sums.end());
92template <
size_t extent,
class SrcType>
99 VCTR_COMMON_UNARY_EXPRESSION_MEMBERS (
MeanSquare, src)
101 static constexpr value_type reductionResultInitValue = 0;
103 VCTR_FORCEDINLINE
constexpr void reduceElementWise (value_type& result,
size_t i)
const
110 VCTR_FORCEDINLINE value_type reduceVectorOp()
const
113 return Expression::Accelerate::meanSquare (src.data(), size());
116 VCTR_FORCEDINLINE value_type reduceVectorOp()
const
119 auto l2Norm = Expression::IPP::l2Norm (src.data(),
sizeToInt (size()));
120 return (l2Norm * l2Norm) / value_type (size());
124 VCTR_FORWARD_PREPARE_SIMD_EVALUATION_UNARY_EXPRESSION_MEMBER_FUNCTIONS
129 auto s = src.getNeon (i);
130 s = Expression::Neon::mul (s, s);
131 result = Expression::Neon::add (result, s);
134 VCTR_FORCEDINLINE VCTR_TARGET (
"fma")
void reduceAVXRegisterWise (
AVXRegister<value_type>& result,
size_t i)
const
137 auto s = src.getAVX (i);
138 s = Expression::AVX::mul (s, s);
139 result = Expression::AVX::add (result, s);
142 VCTR_FORCEDINLINE VCTR_TARGET (
"sse4.1")
void reduceSSERegisterWise (
SSERegister<value_type>& result,
size_t i)
const
145 auto s = src.getSSE (i);
146 s = Expression::SSE::mul (s, s);
147 result = Expression::SSE::add (result, s);
152 VCTR_FORCEDINLINE
constexpr value_type finalizeReduction (
const std::array<value_type, n>& sums)
const
154 auto sum = n == 1 ? sums[0] : std::reduce (sums.begin(), sums.end());
160template <
size_t extent,
class SrcType>
169 static constexpr value_type reductionResultInitValue = 0;
171 VCTR_FORCEDINLINE
constexpr void reduceElementWise (value_type& result,
size_t i)
const
178 VCTR_FORCEDINLINE value_type reduceVectorOp()
const
181 return Expression::Accelerate::rms (src.data(), size());
184 VCTR_FORCEDINLINE value_type reduceVectorOp()
const
187 auto l2Norm = Expression::IPP::l2Norm (src.data(),
sizeToInt (size()));
188 return std::sqrt ((l2Norm * l2Norm) / value_type (size()));
192 VCTR_FORWARD_PREPARE_SIMD_EVALUATION_UNARY_EXPRESSION_MEMBER_FUNCTIONS
197 auto s = src.getNeon (i);
198 s = Expression::Neon::mul (s, s);
199 result = Expression::Neon::add (result, s);
202 VCTR_FORCEDINLINE VCTR_TARGET (
"fma")
void reduceAVXRegisterWise (
AVXRegister<value_type>& result,
size_t i)
const
205 auto s = src.getAVX (i);
206 s = Expression::AVX::mul (s, s);
207 result = Expression::AVX::add (result, s);
210 VCTR_FORCEDINLINE VCTR_TARGET (
"sse4.1")
void reduceSSERegisterWise (
SSERegister<value_type>& result,
size_t i)
const
213 auto s = src.getSSE (i);
214 s = Expression::SSE::mul (s, s);
215 result = Expression::SSE::add (result, s);
220 VCTR_FORCEDINLINE
constexpr value_type finalizeReduction (
const std::array<value_type, n>& squaredSums)
const
222 auto squaredSum = n == 1 ? squaredSums[0] : std::reduce (squaredSums.begin(), squaredSums.end());
228 if (std::is_constant_evaluated())
230 return value_type (gcem::sqrt (meanSquaredSum));
235 return value_type (std::sqrt (meanSquaredSum));
Constrains a type to have a member function getAVX (size_t) const.
Definition: ContainerAndExpressionConcepts.h:92
Constrains a type to have a member function getNeon (size_t) const.
Definition: ContainerAndExpressionConcepts.h:84
Constrains a type to have a member function getSSE (size_t) const.
Definition: ContainerAndExpressionConcepts.h:100
Constrains a type to represent a real valued 32 bit integer number.
Definition: NumericTypeConcepts.h:57
Constrains a type to represent a real valued or std::complex number type.
Definition: NumericTypeConcepts.h:49
Constrains a type to represent a real valued floating point number.
Definition: NumericTypeConcepts.h:83
Constrains a type to represent a real or complex valued floating point number.
Definition: NumericTypeConcepts.h:91
A combined concept to check if Apple Accelerate is a suitable option for a floating point vector redu...
Definition: ContainerAndExpressionConcepts.h:280
A combined concept to check if Intel IPP is a suitable option for a floating point vector reduction o...
Definition: ContainerAndExpressionConcepts.h:304
A combined concept to check if Intel IPP is a suitable option for a real or complex floating point ve...
Definition: ContainerAndExpressionConcepts.h:308
constexpr ExpressionChainBuilder< expressions::RootMeanSquare > rms
Computes the square root of the mean value of the squared source values.
Definition: Mean.h:260
constexpr ExpressionChainBuilder< expressions::Mean > mean
Computes the mean value of the source values.
Definition: Mean.h:248
constexpr ExpressionChainBuilder< expressions::Sum > sum
Computes the sum of the source values.
Definition: Sum.h:118
constexpr ExpressionChainBuilder< expressions::MeanSquare > meanSquare
Computes the mean value of the squared source values.
Definition: Mean.h:254
The main namespace of the VCTR project.
Definition: Array.h:24
typename detail::ValueType< std::remove_cvref_t< T > >::Type ValueType
If T is an expression template, it equals its return type, if it's a type that defines value_type as ...
Definition: Traits.h:201
typename detail::FloatType< std::remove_cvref_t< T > >::Type FloatType
The best matching float type for the real number type T.
Definition: Traits.h:219
typename detail::RealType< std::remove_cvref_t< T > >::Type RealType
If T is any instance of std::complex, this will be the real value_type, otherwise this will be T.
Definition: Traits.h:211
int sizeToInt(size_t size)
Casts the size_t argument to an int.
Definition: PlatformVectorOpsHelpers.h:27
Definition: AVXRegister.h:28
An expression chain builder is an object which supplies various operator<< overloads which build chai...
Definition: ExpressionChainBuilder.h:157
The base class to every expression template.
Definition: ExpressionTemplate.h:37
Definition: NeonRegister.h:28
Definition: SSERegister.h:28