vectorization_logic.cpp
Go to the documentation of this file.
1 // This file is part of Eigen, a lightweight C++ template library
2 // for linear algebra.
3 //
4 // Copyright (C) 2015 Gael Guennebaud <gael.guennebaud@inria.fr>
5 //
6 // This Source Code Form is subject to the terms of the Mozilla
7 // Public License v. 2.0. If a copy of the MPL was not distributed
8 // with this file, You can obtain one at http://mozilla.org/MPL/2.0/.
9 
10 #ifdef EIGEN_TEST_PART_1
11 #define EIGEN_UNALIGNED_VECTORIZE 1
12 #endif
13 
14 #ifdef EIGEN_TEST_PART_2
15 #define EIGEN_UNALIGNED_VECTORIZE 0
16 #endif
17 
18 #ifdef EIGEN_DEFAULT_TO_ROW_MAJOR
19 #undef EIGEN_DEFAULT_TO_ROW_MAJOR
20 #endif
21 #define EIGEN_DEBUG_ASSIGN
22 #include "main.h"
23 #include <typeinfo>
24 
25 using internal::demangle_flags;
26 using internal::demangle_traversal;
27 using internal::demangle_unrolling;
28 
29 template<typename Dst, typename Src>
30 bool test_assign(const Dst&, const Src&, int traversal, int unrolling)
31 {
32  typedef internal::copy_using_evaluator_traits<internal::evaluator<Dst>,internal::evaluator<Src>, internal::assign_op<typename Dst::Scalar,typename Src::Scalar> > traits;
33  bool res = traits::Traversal==traversal;
34  if(unrolling==InnerUnrolling+CompleteUnrolling)
35  res = res && (int(traits::Unrolling)==InnerUnrolling || int(traits::Unrolling)==CompleteUnrolling);
36  else
37  res = res && int(traits::Unrolling)==unrolling;
38  if(!res)
39  {
40  std::cerr << "Src: " << demangle_flags(Src::Flags) << std::endl;
41  std::cerr << " " << demangle_flags(internal::evaluator<Src>::Flags) << std::endl;
42  std::cerr << "Dst: " << demangle_flags(Dst::Flags) << std::endl;
43  std::cerr << " " << demangle_flags(internal::evaluator<Dst>::Flags) << std::endl;
44  traits::debug();
45  std::cerr << " Expected Traversal == " << demangle_traversal(traversal)
46  << " got " << demangle_traversal(traits::Traversal) << "\n";
47  std::cerr << " Expected Unrolling == " << demangle_unrolling(unrolling)
48  << " got " << demangle_unrolling(traits::Unrolling) << "\n";
49  }
50  return res;
51 }
52 
53 template<typename Dst, typename Src>
54 bool test_assign(int traversal, int unrolling)
55 {
56  typedef internal::copy_using_evaluator_traits<internal::evaluator<Dst>,internal::evaluator<Src>, internal::assign_op<typename Dst::Scalar,typename Src::Scalar> > traits;
57  bool res = traits::Traversal==traversal && traits::Unrolling==unrolling;
58  if(!res)
59  {
60  std::cerr << "Src: " << demangle_flags(Src::Flags) << std::endl;
61  std::cerr << " " << demangle_flags(internal::evaluator<Src>::Flags) << std::endl;
62  std::cerr << "Dst: " << demangle_flags(Dst::Flags) << std::endl;
63  std::cerr << " " << demangle_flags(internal::evaluator<Dst>::Flags) << std::endl;
64  traits::debug();
65  std::cerr << " Expected Traversal == " << demangle_traversal(traversal)
66  << " got " << demangle_traversal(traits::Traversal) << "\n";
67  std::cerr << " Expected Unrolling == " << demangle_unrolling(unrolling)
68  << " got " << demangle_unrolling(traits::Unrolling) << "\n";
69  }
70  return res;
71 }
72 
73 template<typename Xpr>
74 bool test_redux(const Xpr&, int traversal, int unrolling)
75 {
76  typedef typename Xpr::Scalar Scalar;
77  typedef internal::redux_traits<internal::scalar_sum_op<Scalar,Scalar>,internal::redux_evaluator<Xpr> > traits;
78 
79  bool res = traits::Traversal==traversal && traits::Unrolling==unrolling;
80  if(!res)
81  {
82  std::cerr << demangle_flags(Xpr::Flags) << std::endl;
83  std::cerr << demangle_flags(internal::evaluator<Xpr>::Flags) << std::endl;
84  traits::debug();
85 
86  std::cerr << " Expected Traversal == " << demangle_traversal(traversal)
87  << " got " << demangle_traversal(traits::Traversal) << "\n";
88  std::cerr << " Expected Unrolling == " << demangle_unrolling(unrolling)
89  << " got " << demangle_unrolling(traits::Unrolling) << "\n";
90  }
91  return res;
92 }
93 
94 template<typename Scalar, bool Enable = internal::packet_traits<Scalar>::Vectorizable>
96 {
97  typedef internal::packet_traits<Scalar> PacketTraits;
98 
101  enum {
104  };
105  static void run()
106  {
107 
110  typedef Matrix<Scalar,Dynamic,Dynamic> MatrixXX;
111  typedef Matrix<Scalar,PacketSize,PacketSize> Matrix11;
117 
118  typedef Matrix<Scalar,
119  (PacketSize==8 ? 4 : PacketSize==4 ? 2 : PacketSize==2 ? 1 : /*PacketSize==1 ?*/ 1),
120  (PacketSize==8 ? 2 : PacketSize==4 ? 2 : PacketSize==2 ? 2 : /*PacketSize==1 ?*/ 1)
121  > Matrix1;
122 
123  typedef Matrix<Scalar,
124  (PacketSize==8 ? 4 : PacketSize==4 ? 2 : PacketSize==2 ? 1 : /*PacketSize==1 ?*/ 1),
125  (PacketSize==8 ? 2 : PacketSize==4 ? 2 : PacketSize==2 ? 2 : /*PacketSize==1 ?*/ 1),
126  DontAlign|((Matrix1::Flags&RowMajorBit)?RowMajor:ColMajor)> Matrix1u;
127 
128  // this type is made such that it can only be vectorized when viewed as a linear 1D vector
129  typedef Matrix<Scalar,
130  (PacketSize==8 ? 4 : PacketSize==4 ? 6 : PacketSize==2 ? ((Matrix11::Flags&RowMajorBit)?2:3) : /*PacketSize==1 ?*/ 1),
131  (PacketSize==8 ? 6 : PacketSize==4 ? 2 : PacketSize==2 ? ((Matrix11::Flags&RowMajorBit)?3:2) : /*PacketSize==1 ?*/ 3)
132  > Matrix3;
133 
134  #if !EIGEN_GCC_AND_ARCH_DOESNT_WANT_STACK_ALIGNMENT
139  VERIFY(test_assign(Vector1(),Vector1().cwiseProduct(Vector1()),
141  VERIFY(test_assign(Vector1(),Vector1().template cast<Scalar>(),
143 
144 
149  VERIFY(test_assign(Vector1(),Vector1().cwiseProduct(Vector1()),
151 
152  VERIFY(test_assign(Matrix44(),Matrix44()+Matrix44(),
154 
155  VERIFY(test_assign(Matrix44u(),Matrix44()+Matrix44(),
158 
160  (Matrix1::InnerSizeAtCompileTime % PacketSize)==0 ? InnerVectorizedTraversal : LinearVectorizedTraversal,
162 
163  VERIFY(test_assign(Matrix1u(),Matrix1()+Matrix1(),
164  EIGEN_UNALIGNED_VECTORIZE ? ((Matrix1::InnerSizeAtCompileTime % PacketSize)==0 ? InnerVectorizedTraversal : LinearVectorizedTraversal)
165  : LinearTraversal, CompleteUnrolling));
166 
167  VERIFY(test_assign(Matrix44c().col(1),Matrix44c().col(2)+Matrix44c().col(3),
169 
170  VERIFY(test_assign(Matrix44r().row(2),Matrix44r().row(1)+Matrix44r().row(1),
172 
173  if(PacketSize>1)
174  {
175  typedef Matrix<Scalar,3,3,ColMajor> Matrix33c;
177  VERIFY(test_assign(Matrix33c().row(2),Matrix33c().row(1)+Matrix33c().row(1),
178  LinearTraversal,CompleteUnrolling));
180  EIGEN_UNALIGNED_VECTORIZE ? (HalfPacketSize==1 ? InnerVectorizedTraversal : LinearVectorizedTraversal) : (HalfPacketSize==1 ? InnerVectorizedTraversal : LinearTraversal), CompleteUnrolling));
181  VERIFY(test_assign(Matrix33c().col(0),Matrix33c().col(1)+Matrix33c().col(1),
182  EIGEN_UNALIGNED_VECTORIZE ? (HalfPacketSize==1 ? InnerVectorizedTraversal : LinearVectorizedTraversal) : (HalfPacketSize==1 ? SliceVectorizedTraversal : LinearTraversal),
183  ((!EIGEN_UNALIGNED_VECTORIZE) && HalfPacketSize==1) ? NoUnrolling : CompleteUnrolling));
184 
185  VERIFY(test_assign(Matrix3(),Matrix3().cwiseProduct(Matrix3()),
186  LinearVectorizedTraversal,CompleteUnrolling));
187 
190  EIGEN_UNALIGNED_VECTORIZE ? LinearVectorizedTraversal :
191  LinearTraversal,
192  NoUnrolling));
193 
194  VERIFY(test_assign(Matrix11(), Matrix11()+Matrix11(),InnerVectorizedTraversal,CompleteUnrolling));
195 
196 
197  VERIFY(test_assign(Matrix11(),Matrix<Scalar,17,17>().template block<PacketSize,PacketSize>(2,3)+Matrix<Scalar,17,17>().template block<PacketSize,PacketSize>(8,4),
199 
200  VERIFY(test_assign(Vector1(),Matrix11()*Vector1(),
201  InnerVectorizedTraversal,CompleteUnrolling));
202 
203  VERIFY(test_assign(Matrix11(),Matrix11().lazyProduct(Matrix11()),
204  InnerVectorizedTraversal,InnerUnrolling+CompleteUnrolling));
205  }
206 
208  LinearVectorizedTraversal,CompleteUnrolling));
209 
211  LinearVectorizedTraversal,CompleteUnrolling));
212 
214  LinearVectorizedTraversal,CompleteUnrolling));
215 
217  LinearVectorizedTraversal,CompleteUnrolling));
218 
219  VERIFY(test_redux(Matrix3(),
220  LinearVectorizedTraversal,CompleteUnrolling));
221 
222  VERIFY(test_redux(Matrix44(),
223  LinearVectorizedTraversal,NoUnrolling));
224 
225  VERIFY(test_redux(Matrix44().template block<(Matrix1::Flags&RowMajorBit)?4:PacketSize,(Matrix1::Flags&RowMajorBit)?PacketSize:4>(1,2),
227 
228  VERIFY(test_redux(Matrix44c().template block<2*PacketSize,1>(1,2),
229  LinearVectorizedTraversal,CompleteUnrolling));
230 
231  VERIFY(test_redux(Matrix44r().template block<1,2*PacketSize>(2,1),
232  LinearVectorizedTraversal,CompleteUnrolling));
233 
236  Matrix22
238 
241  Matrix<Scalar,EIGEN_PLAIN_ENUM_MAX(2,PacketSize),EIGEN_PLAIN_ENUM_MAX(2,PacketSize)>
243 
244  VERIFY((test_assign(Matrix11(), Matrix<Scalar,PacketSize,EIGEN_PLAIN_ENUM_MIN(2,PacketSize)>()*Matrix<Scalar,EIGEN_PLAIN_ENUM_MIN(2,PacketSize),PacketSize>(),
245  InnerVectorizedTraversal, CompleteUnrolling)));
246  #endif
247 
248  VERIFY(test_assign(MatrixXX(10,10),MatrixXX(20,20).block(10,10,2,3),
249  SliceVectorizedTraversal,NoUnrolling));
250 
252  LinearVectorizedTraversal,NoUnrolling));
253  }
254 };
255 
256 template<typename Scalar> struct vectorization_logic<Scalar,false>
257 {
258  static void run() {}
259 };
260 
264 {
265  typedef internal::packet_traits<Scalar> PacketTraits;
267  enum {
269  };
270  static void run()
271  {
272 
274  typedef Matrix<Scalar,PacketSize,PacketSize> Matrix11;
278 // typedef Matrix<Scalar,(Matrix11::Flags&RowMajorBit)?16:4*PacketSize,(Matrix11::Flags&RowMajorBit)?4*PacketSize:16> Matrix44;
279 // typedef Matrix<Scalar,(Matrix11::Flags&RowMajorBit)?16:4*PacketSize,(Matrix11::Flags&RowMajorBit)?4*PacketSize:16,DontAlign|EIGEN_DEFAULT_MATRIX_STORAGE_ORDER_OPTION> Matrix44u;
280 // typedef Matrix<Scalar,4*PacketSize,4*PacketSize,ColMajor> Matrix44c;
281 // typedef Matrix<Scalar,4*PacketSize,4*PacketSize,RowMajor> Matrix44r;
282 
283  typedef Matrix<Scalar,
284  (PacketSize==8 ? 4 : PacketSize==4 ? 2 : PacketSize==2 ? 1 : /*PacketSize==1 ?*/ 1),
285  (PacketSize==8 ? 2 : PacketSize==4 ? 2 : PacketSize==2 ? 2 : /*PacketSize==1 ?*/ 1)
286  > Matrix1;
287 
288  typedef Matrix<Scalar,
289  (PacketSize==8 ? 4 : PacketSize==4 ? 2 : PacketSize==2 ? 1 : /*PacketSize==1 ?*/ 1),
290  (PacketSize==8 ? 2 : PacketSize==4 ? 2 : PacketSize==2 ? 2 : /*PacketSize==1 ?*/ 1),
291  DontAlign|((Matrix1::Flags&RowMajorBit)?RowMajor:ColMajor)> Matrix1u;
292 
293  // this type is made such that it can only be vectorized when viewed as a linear 1D vector
294  typedef Matrix<Scalar,
295  (PacketSize==8 ? 4 : PacketSize==4 ? 6 : PacketSize==2 ? ((Matrix11::Flags&RowMajorBit)?2:3) : /*PacketSize==1 ?*/ 1),
296  (PacketSize==8 ? 6 : PacketSize==4 ? 2 : PacketSize==2 ? ((Matrix11::Flags&RowMajorBit)?3:2) : /*PacketSize==1 ?*/ 3)
297  > Matrix3;
298 
299  #if !EIGEN_GCC_AND_ARCH_DOESNT_WANT_STACK_ALIGNMENT
304  VERIFY(test_assign(Vector1(),Vector1().template segment<PacketSize>(0).derived(),
308  VERIFY(test_assign(Vector1(),(Scalar(2.1)*Vector1().template segment<PacketSize>(0)-Vector1().template segment<PacketSize>(0)).derived(),
310  VERIFY(test_assign(Vector1(),Vector1().cwiseProduct(Vector1()),
312  VERIFY(test_assign(Vector1(),Vector1().template cast<Scalar>(),
314 
315 
320  VERIFY(test_assign(Vector1(),Vector1().cwiseProduct(Vector1()),
322 
323  VERIFY(test_assign(Matrix57(),Matrix57()+Matrix57(),
325 
326  VERIFY(test_assign(Matrix57u(),Matrix57()+Matrix57(),
329 
330  VERIFY(test_assign(Matrix1u(),Matrix1()+Matrix1(),
331  EIGEN_UNALIGNED_VECTORIZE ? ((Matrix1::InnerSizeAtCompileTime % PacketSize)==0 ? InnerVectorizedTraversal : LinearVectorizedTraversal) : LinearTraversal,CompleteUnrolling));
332 
333  if(PacketSize>1)
334  {
335  typedef Matrix<Scalar,3,3,ColMajor> Matrix33c;
336  VERIFY(test_assign(Matrix33c().row(2),Matrix33c().row(1)+Matrix33c().row(1),
337  LinearTraversal,CompleteUnrolling));
338  VERIFY(test_assign(Matrix33c().col(0),Matrix33c().col(1)+Matrix33c().col(1),
339  EIGEN_UNALIGNED_VECTORIZE ? (PacketSize==1 ? InnerVectorizedTraversal : LinearVectorizedTraversal) : LinearTraversal,CompleteUnrolling));
340 
341  VERIFY(test_assign(Matrix3(),Matrix3().cwiseQuotient(Matrix3()),
342  PacketTraits::HasDiv ? LinearVectorizedTraversal : LinearTraversal,CompleteUnrolling));
343 
345  EIGEN_UNALIGNED_VECTORIZE ? (PacketSize==1 ? InnerVectorizedTraversal : LinearVectorizedTraversal) : LinearTraversal,
346  NoUnrolling));
347 
348  VERIFY(test_assign(Matrix11(),Matrix<Scalar,17,17>().template block<PacketSize,PacketSize>(2,3)+Matrix<Scalar,17,17>().template block<PacketSize,PacketSize>(8,4),
350 
351  VERIFY(test_assign(Vector1(),Matrix11()*Vector1(),
352  InnerVectorizedTraversal,CompleteUnrolling));
353 
354  VERIFY(test_assign(Matrix11(),Matrix11().lazyProduct(Matrix11()),
355  InnerVectorizedTraversal,InnerUnrolling+CompleteUnrolling));
356  }
357 
359  LinearVectorizedTraversal,CompleteUnrolling));
360 
362  LinearVectorizedTraversal,CompleteUnrolling));
363 
364  VERIFY(test_redux(Matrix3(),
365  LinearVectorizedTraversal,CompleteUnrolling));
366 
367  VERIFY(test_redux(Matrix35(),
368  LinearVectorizedTraversal,CompleteUnrolling));
369 
370  VERIFY(test_redux(Matrix57().template block<PacketSize,3>(1,0),
372 
375  Matrix<Scalar,EIGEN_PLAIN_ENUM_MAX(2,PacketSize),EIGEN_PLAIN_ENUM_MAX(2,PacketSize)>
377 
380  #endif
381  }
382 };
383 
384 template<typename Scalar> struct vectorization_logic_half<Scalar,false>
385 {
386  static void run() {}
387 };
388 
390 {
391 
392 #ifdef EIGEN_VECTORIZE
393 
397  CALL_SUBTEST( vectorization_logic<std::complex<float> >::run() );
398  CALL_SUBTEST( vectorization_logic<std::complex<double> >::run() );
399 
403  CALL_SUBTEST( vectorization_logic_half<std::complex<float> >::run() );
404  CALL_SUBTEST( vectorization_logic_half<std::complex<double> >::run() );
405 
406  if(internal::packet_traits<float>::Vectorizable)
407  {
410 
413  }
414 
415  if(internal::packet_traits<double>::Vectorizable)
416  {
419 
422  }
423 #endif // EIGEN_VECTORIZE
424 
425 }
int array[24]
internal::packet_traits< Scalar >::type PacketType
SCALAR Scalar
Definition: bench_gemm.cpp:33
internal::packet_traits< Scalar > PacketTraits
void test_vectorization_logic()
m m block(1, 0, 2, 2)<< 4
return int(ret)+1
Eigen::Vector3d Vector3
Definition: Vector.h:43
Eigen::Matrix< double, 1, 1 > Vector1
Definition: testEvent.cpp:34
A matrix or vector expression mapping an existing array of data.
Definition: Map.h:94
Matrix< Scalar, Dynamic, 1 > VectorX
Definition: sparse_lu.cpp:41
#define EIGEN_PLAIN_ENUM_MAX(a, b)
Definition: Macros.h:876
const unsigned int RowMajorBit
Definition: Constants.h:61
internal::unpacket_traits< typename internal::packet_traits< Scalar >::type >::half PacketType
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE const CwiseBinaryOp< internal::scalar_quotient_op< Scalar >, const Derived, const OtherDerived > cwiseQuotient(const EIGEN_CURRENT_STORAGE_BASE_CLASS< OtherDerived > &other) const
Eigen::Matrix< double, 1, 1 > Matrix1
Definition: timeRot2.cpp:77
cout<< "Here is the matrix m:"<< endl<< m<< endl;Matrix< ptrdiff_t, 3, 1 > res
Scalar Scalar int size
Definition: benchVecAdd.cpp:17
m row(1)
Convenience specialization of Stride to specify only an inner stride See class Map for some examples...
Definition: Stride.h:90
internal::unpacket_traits< PacketType >::half HalfPacketType
static bool debug
bool test_assign(const Dst &, const Src &, int traversal, int unrolling)
#define CALL_SUBTEST(FUNC)
Definition: main.h:342
#define VERIFY(a)
Definition: main.h:325
#define EIGEN_PLAIN_ENUM_MIN(a, b)
Definition: Macros.h:875
m col(1)
The matrix class, also used for vectors and row-vectors.
bool test_redux(const Xpr &, int traversal, int unrolling)
Convenience specialization of Stride to specify only an outer stride See class Map for some examples...
Definition: Stride.h:101
internal::packet_traits< Scalar > PacketTraits
#define EIGEN_UNALIGNED_VECTORIZE
Definition: Macros.h:786


gtsam
Author(s):
autogenerated on Sat May 8 2021 02:51:23