VCTR
Loading...
Searching...
No Matches
Abs.h
1/*
2 ==============================================================================
3 DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
4
5 Copyright 2022- by sonible GmbH.
6
7 This file is part of VCTR - Versatile Container Templates Reconceptualized.
8
9 VCTR is free software: you can redistribute it and/or modify
10 it under the terms of the GNU Lesser General Public License version 3
11 only, as published by the Free Software Foundation.
12
13 VCTR is distributed in the hope that it will be useful,
14 but WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 GNU Lesser General Public License version 3 for more details.
17
18 You should have received a copy of the GNU Lesser General Public License
19 version 3 along with VCTR. If not, see <https://www.gnu.org/licenses/>.
20 ==============================================================================
21*/
22
23namespace vctr::expressions
24{
25
26template <size_t extent, class SrcType>
28{
29public:
30 using value_type = RealType<ValueType<SrcType>>;
31
32 VCTR_COMMON_UNARY_EXPRESSION_MEMBERS (Abs, src)
33
34 VCTR_FORCEDINLINE constexpr value_type operator[] (size_t i) const
36 {
37 return std::abs (src[i]);
38 }
39
40 VCTR_FORCEDINLINE constexpr value_type operator[] (size_t i) const
42 {
43 return src[i];
44 }
45
46 // clang-format off
47 VCTR_FORCEDINLINE const value_type* evalNextVectorOpInExpressionChain (value_type* dst) const
48 requires is::suitableForAccelerateRealFloatVectorOp <SrcType, value_type, detail::dontPreferIfIppAndAccelerateAreAvailable> ||
50 // clang-format on
51 {
52 Expression::Accelerate::abs (src.evalNextVectorOpInExpressionChain (dst), dst, size());
53 return dst;
54 }
55
56 // clang-format off
57 VCTR_FORCEDINLINE const value_type* evalNextVectorOpInExpressionChain (value_type* dst) const
58 requires is::suitableForIppRealSingedInt32VectorOp <SrcType, value_type, detail::preferIfIppAndAccelerateAreAvailable> ||
59 is::suitableForIppRealFloatVectorOp <SrcType, value_type, detail::preferIfIppAndAccelerateAreAvailable> ||
61 // clang-format on
62 {
63 Expression::IPP::abs (src.evalNextVectorOpInExpressionChain (dst), dst, sizeToInt (size()));
64 return dst;
65 }
66
67 //==============================================================================
68 VCTR_FORWARD_PREPARE_SIMD_EVALUATION_UNARY_EXPRESSION_MEMBER_FUNCTIONS
69
70 NeonRegister<value_type> getNeon (size_t i) const
71 requires (archARM && has::getNeon<SrcType> && Expression::CommonElement::isSigned)
72 {
73 return Expression::Neon::abs (src.getNeon (i));
74 }
75
76 NeonRegister<value_type> getNeon (size_t i) const
77 requires (archARM && has::getNeon<SrcType> && ! Expression::CommonElement::isSigned)
78 {
79 return src.getNeon (i); // unsigned integers are always positive
80 }
81
82 // AVX Implementation
83 VCTR_FORCEDINLINE VCTR_TARGET ("fma") AVXRegister<value_type> getAVX (size_t i) const
84 requires (archX64 && has::getAVX<SrcType> && Expression::CommonElement::isRealFloat)
85 {
86 static const auto avxSignBit = Expression::AVX::broadcast (typename Expression::CommonElement::Type (-0.0));
87
88 return Expression::AVX::bitwiseAndNot (src.getAVX (i), avxSignBit);
89 }
90
91 VCTR_FORCEDINLINE VCTR_TARGET ("avx2") AVXRegister<value_type> getAVX (size_t i) const
92 requires (archX64 && has::getAVX<SrcType> && Expression::CommonElement::isInt32)
93 {
94 return Expression::AVX::abs (src.getAVX (i));
95 }
96
97 VCTR_FORCEDINLINE VCTR_TARGET ("avx2") AVXRegister<value_type> getAVX (size_t i) const
98 requires (archX64 && has::getAVX<SrcType> && Expression::CommonElement::isUnsigned)
99 {
100 return src.getAVX (i); // unsigned integers are always positive
101 }
102
103 // SSE Implementation
104 VCTR_FORCEDINLINE VCTR_TARGET ("sse4.1") SSERegister<value_type> getSSE (size_t i) const
105 requires (archX64 && has::getSSE<SrcType> && Expression::CommonElement::isRealFloat)
106 {
107 static const auto sseSignBit = Expression::SSE::broadcast (typename Expression::CommonElement::Type (-0.0));
108
109 return Expression::SSE::bitwiseAndNot (src.getSSE (i), sseSignBit);
110 }
111
112 VCTR_FORCEDINLINE VCTR_TARGET ("sse4.1") SSERegister<value_type> getSSE (size_t i) const
113 requires (archX64 && has::getSSE<SrcType> && Expression::CommonElement::isInt32)
114 {
115 return Expression::SSE::abs (src.getSSE (i));
116 }
117
118 VCTR_FORCEDINLINE VCTR_TARGET ("sse4.1") SSERegister<value_type> getSSE (size_t i) const
119 requires (archX64 && has::getSSE<SrcType> && Expression::CommonElement::isUnsigned)
120 {
121 return src.getSSE (i); // unsigned integers are always positive
122 }
123};
124
125} // namespace vctr::expressions
126
127namespace vctr
128{
136
137} // namespace vctr
Definition: Abs.h:28
Constrains a type to have a member function getAVX (size_t) const.
Definition: ContainerAndExpressionConcepts.h:92
Constrains a type to have a member function getNeon (size_t) const.
Definition: ContainerAndExpressionConcepts.h:84
Constrains a type to have a member function getSSE (size_t) const.
Definition: ContainerAndExpressionConcepts.h:100
Constrains a type to represent a real valued signed number (e.g.
Definition: NumericTypeConcepts.h:65
A combined concept to check if Apple Accelerate is a suitable option for a floating point vector oper...
Definition: ContainerAndExpressionConcepts.h:272
A combined concept to check if Intel IPP is a suitable option for a floating point vector operation t...
Definition: ContainerAndExpressionConcepts.h:300
Constrains a type to represent a real valued unsigned integer number.
Definition: NumericTypeConcepts.h:74
constexpr ExpressionChainBuilder< expressions::Abs > abs
Computes the absolute value of the source values.
Definition: Abs.h:135
The main namespace of the VCTR project.
Definition: Array.h:24
typename detail::RealType< std::remove_cvref_t< T > >::Type RealType
If T is any instance of std::complex, this will be the real value_type, otherwise this will be T.
Definition: Traits.h:211
int sizeToInt(size_t size)
Casts the size_t argument to an int.
Definition: PlatformVectorOpsHelpers.h:27
Definition: AVXRegister.h:28
An expression chain builder is an object which supplies various operator<< overloads which build chai...
Definition: ExpressionChainBuilder.h:157
The base class to every expression template.
Definition: ExpressionTemplate.h:37
Definition: NeonRegister.h:28
Definition: SSERegister.h:28