TR-mbed 1.0
Loading...
Searching...
No Matches
Complex.h
Go to the documentation of this file.
1// This file is part of Eigen, a lightweight C++ template library
2// for linear algebra.
3//
4// Copyright (C) 2014 Benoit Steiner (benoit.steiner.goog@gmail.com)
5//
6// This Source Code Form is subject to the terms of the Mozilla
7// Public License v. 2.0. If a copy of the MPL was not distributed
8// with this file, You can obtain one at http://mozilla.org/MPL/2.0/.
9
10#ifndef EIGEN_COMPLEX_AVX_H
11#define EIGEN_COMPLEX_AVX_H
12
13namespace Eigen {
14
15namespace internal {
16
17//---------- float ----------
24
25#ifndef EIGEN_VECTORIZE_AVX512
26template<> struct packet_traits<std::complex<float> > : default_packet_traits
27{
28 typedef Packet4cf type;
29 typedef Packet2cf half;
30 enum {
31 Vectorizable = 1,
33 size = 4,
34 HasHalfPacket = 1,
35
36 HasAdd = 1,
37 HasSub = 1,
38 HasMul = 1,
39 HasDiv = 1,
40 HasNegate = 1,
42 HasAbs = 0,
43 HasAbs2 = 0,
44 HasMin = 0,
45 HasMax = 0,
46 HasSetLinear = 0
47 };
48};
49#endif
50
51template<> struct unpacket_traits<Packet4cf> {
52 typedef std::complex<float> type;
53 typedef Packet2cf half;
55 enum {
61 };
62};
63
67{
68 return Packet4cf(pnegate(a.v));
69}
71{
72 const __m256 mask = _mm256_castsi256_ps(_mm256_setr_epi32(0x00000000,0x80000000,0x00000000,0x80000000,0x00000000,0x80000000,0x00000000,0x80000000));
73 return Packet4cf(_mm256_xor_ps(a.v,mask));
74}
75
83
84template <>
89
95
98
99
100template<> EIGEN_STRONG_INLINE Packet4cf pset1<Packet4cf>(const std::complex<float>& from)
101{
102 return Packet4cf(_mm256_castpd_ps(_mm256_broadcast_sd((const double*)(const void*)&from)));
103}
104
105template<> EIGEN_STRONG_INLINE Packet4cf ploaddup<Packet4cf>(const std::complex<float>* from)
106{
107 // FIXME The following might be optimized using _mm256_movedup_pd
111}
112
115
116template<> EIGEN_DEVICE_FUNC inline Packet4cf pgather<std::complex<float>, Packet4cf>(const std::complex<float>* from, Index stride)
117{
118 return Packet4cf(_mm256_set_ps(std::imag(from[3*stride]), std::real(from[3*stride]),
119 std::imag(from[2*stride]), std::real(from[2*stride]),
120 std::imag(from[1*stride]), std::real(from[1*stride]),
121 std::imag(from[0*stride]), std::real(from[0*stride])));
122}
123
124template<> EIGEN_DEVICE_FUNC inline void pscatter<std::complex<float>, Packet4cf>(std::complex<float>* to, const Packet4cf& from, Index stride)
125{
127 to[stride*0] = std::complex<float>(_mm_cvtss_f32(_mm_shuffle_ps(low, low, 0)),
128 _mm_cvtss_f32(_mm_shuffle_ps(low, low, 1)));
129 to[stride*1] = std::complex<float>(_mm_cvtss_f32(_mm_shuffle_ps(low, low, 2)),
130 _mm_cvtss_f32(_mm_shuffle_ps(low, low, 3)));
131
132 __m128 high = _mm256_extractf128_ps(from.v, 1);
133 to[stride*2] = std::complex<float>(_mm_cvtss_f32(_mm_shuffle_ps(high, high, 0)),
134 _mm_cvtss_f32(_mm_shuffle_ps(high, high, 1)));
135 to[stride*3] = std::complex<float>(_mm_cvtss_f32(_mm_shuffle_ps(high, high, 2)),
136 _mm_cvtss_f32(_mm_shuffle_ps(high, high, 3)));
137
138}
139
140template<> EIGEN_STRONG_INLINE std::complex<float> pfirst<Packet4cf>(const Packet4cf& a)
141{
143}
144
157
158template<> EIGEN_STRONG_INLINE std::complex<float> predux<Packet4cf>(const Packet4cf& a)
159{
162}
163
164template<> EIGEN_STRONG_INLINE std::complex<float> predux_mul<Packet4cf>(const Packet4cf& a)
165{
168}
169
171
180
182{
183 return Packet4cf(_mm256_shuffle_ps(x.v, x.v, _MM_SHUFFLE(2, 3, 0 ,1)));
184}
185
186//---------- double ----------
193
194#ifndef EIGEN_VECTORIZE_AVX512
195template<> struct packet_traits<std::complex<double> > : default_packet_traits
196{
199 enum {
202 size = 2,
204
215 HasSetLinear = 0
216 };
217};
218#endif
219
220template<> struct unpacket_traits<Packet2cd> {
221 typedef std::complex<double> type;
224 enum {
230 };
231};
232
237{
238 const __m256d mask = _mm256_castsi256_pd(_mm256_set_epi32(0x80000000,0x0,0x0,0x0,0x80000000,0x0,0x0,0x0));
239 return Packet2cd(_mm256_xor_pd(a.v,mask));
240}
241
243{
244 __m256d tmp1 = _mm256_shuffle_pd(a.v,a.v,0x0);
245 __m256d even = _mm256_mul_pd(tmp1, b.v);
246 __m256d tmp2 = _mm256_shuffle_pd(a.v,a.v,0xF);
247 __m256d tmp3 = _mm256_shuffle_pd(b.v,b.v,0x5);
248 __m256d odd = _mm256_mul_pd(tmp2, tmp3);
250}
251
252template <>
257
263
264template<> EIGEN_STRONG_INLINE Packet2cd pload <Packet2cd>(const std::complex<double>* from)
265{ EIGEN_DEBUG_ALIGNED_LOAD return Packet2cd(pload<Packet4d>((const double*)from)); }
266template<> EIGEN_STRONG_INLINE Packet2cd ploadu<Packet2cd>(const std::complex<double>* from)
268
269template<> EIGEN_STRONG_INLINE Packet2cd pset1<Packet2cd>(const std::complex<double>& from)
270{
271 // in case casting to a __m128d* is really not safe, then we can still fallback to this version: (much slower though)
272// return Packet2cd(_mm256_loadu2_m128d((const double*)&from,(const double*)&from));
273 return Packet2cd(_mm256_broadcast_pd((const __m128d*)(const void*)&from));
274}
275
276template<> EIGEN_STRONG_INLINE Packet2cd ploaddup<Packet2cd>(const std::complex<double>* from) { return pset1<Packet2cd>(*from); }
277
278template<> EIGEN_STRONG_INLINE void pstore <std::complex<double> >(std::complex<double> * to, const Packet2cd& from) { EIGEN_DEBUG_ALIGNED_STORE pstore((double*)to, from.v); }
279template<> EIGEN_STRONG_INLINE void pstoreu<std::complex<double> >(std::complex<double> * to, const Packet2cd& from) { EIGEN_DEBUG_UNALIGNED_STORE pstoreu((double*)to, from.v); }
280
281template<> EIGEN_DEVICE_FUNC inline Packet2cd pgather<std::complex<double>, Packet2cd>(const std::complex<double>* from, Index stride)
282{
283 return Packet2cd(_mm256_set_pd(std::imag(from[1*stride]), std::real(from[1*stride]),
284 std::imag(from[0*stride]), std::real(from[0*stride])));
285}
286
287template<> EIGEN_DEVICE_FUNC inline void pscatter<std::complex<double>, Packet2cd>(std::complex<double>* to, const Packet2cd& from, Index stride)
288{
290 to[stride*0] = std::complex<double>(_mm_cvtsd_f64(low), _mm_cvtsd_f64(_mm_shuffle_pd(low, low, 1)));
292 to[stride*1] = std::complex<double>(_mm_cvtsd_f64(high), _mm_cvtsd_f64(_mm_shuffle_pd(high, high, 1)));
293}
294
295template<> EIGEN_STRONG_INLINE std::complex<double> pfirst<Packet2cd>(const Packet2cd& a)
296{
297 __m128d low = _mm256_extractf128_pd(a.v, 0);
298 EIGEN_ALIGN16 double res[2];
299 _mm_store_pd(res, low);
300 return std::complex<double>(res[0],res[1]);
301}
302
307
308template<> EIGEN_STRONG_INLINE std::complex<double> predux<Packet2cd>(const Packet2cd& a)
309{
312}
313
314template<> EIGEN_STRONG_INLINE std::complex<double> predux_mul<Packet2cd>(const Packet2cd& a)
315{
318}
319
321
329
331{
332 return Packet2cd(_mm256_shuffle_pd(x.v, x.v, 0x5));
333}
334
335EIGEN_DEVICE_FUNC inline void
337 __m256d P0 = _mm256_castps_pd(kernel.packet[0].v);
338 __m256d P1 = _mm256_castps_pd(kernel.packet[1].v);
339 __m256d P2 = _mm256_castps_pd(kernel.packet[2].v);
340 __m256d P3 = _mm256_castps_pd(kernel.packet[3].v);
341
346
347 kernel.packet[1].v = _mm256_castpd_ps(_mm256_permute2f128_pd(T0, T2, 32));
348 kernel.packet[3].v = _mm256_castpd_ps(_mm256_permute2f128_pd(T0, T2, 49));
349 kernel.packet[0].v = _mm256_castpd_ps(_mm256_permute2f128_pd(T1, T3, 32));
350 kernel.packet[2].v = _mm256_castpd_ps(_mm256_permute2f128_pd(T1, T3, 49));
351}
352
353EIGEN_DEVICE_FUNC inline void
355 __m256d tmp = _mm256_permute2f128_pd(kernel.packet[0].v, kernel.packet[1].v, 0+(2<<4));
356 kernel.packet[1].v = _mm256_permute2f128_pd(kernel.packet[0].v, kernel.packet[1].v, 1+(3<<4));
357 kernel.packet[0].v = tmp;
358}
359
363
367
368} // end namespace internal
369
370} // end namespace Eigen
371
372#endif // EIGEN_COMPLEX_AVX_H
ArrayXXi a
Definition Array_initializer_list_23_cxx11.cpp:1
#define EIGEN_ALIGN16
Definition ConfigureVectorization.h:153
#define EIGEN_MAKE_CONJ_HELPER_CPLX_REAL(PACKET_CPLX, PACKET_REAL)
Definition ConjHelper.h:14
#define EIGEN_DEBUG_ALIGNED_STORE
Definition GenericPacketMath.h:35
#define EIGEN_DEBUG_ALIGNED_LOAD
Definition GenericPacketMath.h:27
#define EIGEN_DEBUG_UNALIGNED_STORE
Definition GenericPacketMath.h:39
#define EIGEN_DEBUG_UNALIGNED_LOAD
Definition GenericPacketMath.h:31
#define EIGEN_DEVICE_FUNC
Definition Macros.h:976
#define EIGEN_STRONG_INLINE
Definition Macros.h:917
cout<< "Here is the matrix m:"<< endl<< m<< endl;Matrix< ptrdiff_t, 3, 1 > res
Definition PartialRedux_count.cpp:3
Scalar * b
Definition benchVecAdd.cpp:17
set noclip points set clip one set noclip two set bar set border lt lw set xdata set ydata set zdata set x2data set y2data set boxwidth set dummy x
Definition gnuplot_common_settings.hh:12
@ Aligned32
Definition Constants.h:236
EIGEN_STRONG_INLINE std::complex< double > predux< Packet2cd >(const Packet2cd &a)
Definition Complex.h:308
EIGEN_STRONG_INLINE Packet2cf pconj(const Packet2cf &a)
Definition Complex.h:167
EIGEN_STRONG_INLINE Packet4cf ploadu< Packet4cf >(const std::complex< float > *from)
Definition Complex.h:97
EIGEN_DEVICE_FUNC Packet padd(const Packet &a, const Packet &b)
Definition GenericPacketMath.h:215
EIGEN_DEVICE_FUNC unpacket_traits< Packet >::type predux(const Packet &a)
Definition GenericPacketMath.h:875
EIGEN_STRONG_INLINE std::complex< float > predux_mul< Packet4cf >(const Packet4cf &a)
Definition Complex.h:164
EIGEN_STRONG_INLINE Packet2cd pcplxflip< Packet2cd >(const Packet2cd &x)
Definition Complex.h:330
EIGEN_STRONG_INLINE Packet4cf psub< Packet4cf >(const Packet4cf &a, const Packet4cf &b)
Definition Complex.h:65
EIGEN_STRONG_INLINE Packet2cd pset1< Packet2cd >(const std::complex< double > &from)
Definition Complex.h:269
EIGEN_STRONG_INLINE std::complex< float > pfirst< Packet4cf >(const Packet4cf &a)
Definition Complex.h:140
EIGEN_STRONG_INLINE Packet2cd ploaddup< Packet2cd >(const std::complex< double > *from)
Definition Complex.h:276
EIGEN_STRONG_INLINE Packet2cd psqrt< Packet2cd >(const Packet2cd &a)
Definition Complex.h:360
EIGEN_STRONG_INLINE void ptranspose(PacketBlock< Packet2cf, 2 > &kernel)
Definition Complex.h:224
EIGEN_STRONG_INLINE Packet2cf ploaddup< Packet2cf >(const std::complex< float > *from)
Definition Complex.h:125
EIGEN_STRONG_INLINE Packet2cd pand< Packet2cd >(const Packet2cd &a, const Packet2cd &b)
Definition Complex.h:259
EIGEN_STRONG_INLINE Packet4cf pxor< Packet4cf >(const Packet4cf &a, const Packet4cf &b)
Definition Complex.h:93
EIGEN_DEVICE_FUNC Packet pdiv(const Packet &a, const Packet &b)
Definition GenericPacketMath.h:244
EIGEN_STRONG_INLINE Packet2cd ploadu< Packet2cd >(const std::complex< double > *from)
Definition Complex.h:266
EIGEN_STRONG_INLINE std::complex< double > predux_mul< Packet2cd >(const Packet2cd &a)
Definition Complex.h:314
EIGEN_STRONG_INLINE std::complex< double > pfirst< Packet2cd >(const Packet2cd &a)
Definition Complex.h:295
EIGEN_STRONG_INLINE Packet2cd por< Packet2cd >(const Packet2cd &a, const Packet2cd &b)
Definition Complex.h:260
EIGEN_STRONG_INLINE Packet2cd ptrue< Packet2cd >(const Packet2cd &a)
Definition Complex.h:258
EIGEN_STRONG_INLINE Packet4cf ptrue< Packet4cf >(const Packet4cf &a)
Definition Complex.h:90
EIGEN_STRONG_INLINE Packet4cf pand< Packet4cf >(const Packet4cf &a, const Packet4cf &b)
Definition Complex.h:91
EIGEN_STRONG_INLINE Packet4cf pset1< Packet4cf >(const std::complex< float > &from)
Definition Complex.h:100
EIGEN_STRONG_INLINE Packet2cd pload< Packet2cd >(const std::complex< double > *from)
Definition Complex.h:264
EIGEN_STRONG_INLINE Packet2cf preverse(const Packet2cf &a)
Definition Complex.h:184
EIGEN_DEVICE_FUNC unpacket_traits< Packet >::type predux_mul(const Packet &a)
Definition GenericPacketMath.h:882
EIGEN_STRONG_INLINE Packet2cd pandnot< Packet2cd >(const Packet2cd &a, const Packet2cd &b)
Definition Complex.h:262
EIGEN_DEVICE_FUNC Packet pmul(const Packet &a, const Packet &b)
Definition GenericPacketMath.h:237
EIGEN_STRONG_INLINE Packet8h ptrue(const Packet8h &a)
Definition PacketMath.h:978
EIGEN_STRONG_INLINE Packet2cd psub< Packet2cd >(const Packet2cd &a, const Packet2cd &b)
Definition Complex.h:234
EIGEN_STRONG_INLINE Packet2cf pnegate(const Packet2cf &a)
Definition Complex.h:166
EIGEN_STRONG_INLINE Packet4cf ploaddup< Packet4cf >(const std::complex< float > *from)
Definition Complex.h:105
EIGEN_STRONG_INLINE Packet4cf pandnot< Packet4cf >(const Packet4cf &a, const Packet4cf &b)
Definition Complex.h:94
EIGEN_STRONG_INLINE bfloat16 pfirst(const Packet8bf &a)
Definition PacketMath.h:1429
EIGEN_DEVICE_FUNC void pstore(Scalar *to, const Packet &from)
Definition GenericPacketMath.h:696
EIGEN_STRONG_INLINE Packet2cd pxor< Packet2cd >(const Packet2cd &a, const Packet2cd &b)
Definition Complex.h:261
EIGEN_STRONG_INLINE Packet4cf padd< Packet4cf >(const Packet4cf &a, const Packet4cf &b)
Definition Complex.h:64
EIGEN_STRONG_INLINE Packet2cf pcmp_eq(const Packet2cf &a, const Packet2cf &b)
Definition Complex.h:231
EIGEN_DEVICE_FUNC void pstoreu(Scalar *to, const Packet &from)
Definition GenericPacketMath.h:700
EIGEN_STRONG_INLINE Packet8h pand(const Packet8h &a, const Packet8h &b)
Definition PacketMath.h:1050
EIGEN_STRONG_INLINE Packet2cd pmul< Packet2cd >(const Packet2cd &a, const Packet2cd &b)
Definition Complex.h:242
EIGEN_STRONG_INLINE Packet4cf pmul< Packet4cf >(const Packet4cf &a, const Packet4cf &b)
Definition Complex.h:76
EIGEN_STRONG_INLINE Packet4cf pcplxflip< Packet4cf >(const Packet4cf &x)
Definition Complex.h:181
EIGEN_STRONG_INLINE Packet4cf pload< Packet4cf >(const std::complex< float > *from)
Definition Complex.h:96
__m256 Packet8f
Definition PacketMath.h:31
EIGEN_STRONG_INLINE std::complex< float > predux< Packet4cf >(const Packet4cf &a)
Definition Complex.h:158
EIGEN_STRONG_INLINE Packet4cf por< Packet4cf >(const Packet4cf &a, const Packet4cf &b)
Definition Complex.h:92
EIGEN_STRONG_INLINE Packet2cd padd< Packet2cd >(const Packet2cd &a, const Packet2cd &b)
Definition Complex.h:233
__m256d Packet4d
Definition PacketMath.h:33
EIGEN_STRONG_INLINE Packet4cf psqrt< Packet4cf >(const Packet4cf &a)
Definition Complex.h:364
EIGEN_DEVICE_FUNC internal::add_const_on_value_type< EIGEN_MATHFUNC_RETVAL(real_ref, Scalar)>::type real_ref(const Scalar &x)
Definition MathFunctions.h:1237
Namespace containing all symbols from the Eigen library.
Definition bench_norm.cpp:85
EIGEN_DEFAULT_DENSE_INDEX_TYPE Index
The Index type as used for the API.
Definition Meta.h:74
Definition BandTriangularSolver.h:13
Definition BFloat16.h:88
Definition Complex.h:341
Definition Complex.h:188
EIGEN_STRONG_INLINE Packet2cd()
Definition Complex.h:189
__m256d v
Definition Complex.h:191
EIGEN_STRONG_INLINE Packet2cd(const __m256d &a)
Definition Complex.h:190
Definition Complex.h:31
Definition Complex.h:19
EIGEN_STRONG_INLINE Packet4cf(const __m256 &a)
Definition Complex.h:21
__m256 v
Definition Complex.h:22
EIGEN_STRONG_INLINE Packet4cf()
Definition Complex.h:20
Definition GenericPacketMath.h:43
@ HasSqrt
Definition GenericPacketMath.h:66
@ HasDiv
Definition GenericPacketMath.h:65
Definition GenericPacketMath.h:107
@ HasSub
Definition GenericPacketMath.h:118
@ HasMax
Definition GenericPacketMath.h:124
@ HasNegate
Definition GenericPacketMath.h:120
@ HasMul
Definition GenericPacketMath.h:119
@ HasAdd
Definition GenericPacketMath.h:117
@ HasSetLinear
Definition GenericPacketMath.h:126
@ HasMin
Definition GenericPacketMath.h:123
@ HasAbs2
Definition GenericPacketMath.h:122
@ HasAbs
Definition GenericPacketMath.h:121
@ HasHalfPacket
Definition GenericPacketMath.h:114
@ size
Definition GenericPacketMath.h:112
@ AlignedOnScalar
Definition GenericPacketMath.h:113
@ Vectorizable
Definition GenericPacketMath.h:111
Definition ForwardDeclarations.h:17
Packet1cd half
Definition Complex.h:222
Packet4d as_real
Definition Complex.h:223
std::complex< double > type
Definition Complex.h:221
std::complex< float > type
Definition Complex.h:52
Packet2cf half
Definition Complex.h:53
Packet8f as_real
Definition Complex.h:54
Definition GenericPacketMath.h:133
@ masked_load_available
Definition GenericPacketMath.h:141
@ size
Definition GenericPacketMath.h:138
@ masked_store_available
Definition GenericPacketMath.h:142
@ vectorizable
Definition GenericPacketMath.h:140
@ alignment
Definition GenericPacketMath.h:139
Definition datatypes.h:12