Select AVX2 even if the data size is not a multiple of 8

commit: eb85b97339e3791d533592bac20999b1b3ebca09 [log] [tgz]
author: Francesco Mazzoli <f@mazzo.li> Mon Nov 29 21:13:24 2021 +0000
committer: Rasmus Munk Larsen <rmlarsen@google.com> Mon Nov 29 21:13:24 2021 +0000
tree: 12cbf8de9fe0d5e2560c38be3c9025c667b0712d
parent: eef33946b79663a9e9aec41c14579f9ae581b389 [diff] [blame]
diff --git a/test/vectorization_logic.cpp b/test/vectorization_logic.cpp
index 602e9f1..62d3f60 100644
--- a/test/vectorization_logic.cpp
+++ b/test/vectorization_logic.cpp

@@ -258,7 +258,38 @@
 
     VERIFY(test_redux(VectorX(10),
       LinearVectorizedTraversal,NoUnrolling));
+
+    // Some static checks for packet-picking -- see
+    // <https://gitlab.com/libeigen/eigen/merge_requests/46#note_271497656> for context.
+
+    // Any size that is a multiple of the packet size (including the packet size itself) picks the full packet
+    STATIC_CHECK((
+      internal::is_same<typename internal::find_best_packet<Scalar, PacketSize>::type, PacketType>::value
+    ));
+    STATIC_CHECK((
+      internal::is_same<typename internal::find_best_packet<Scalar, PacketSize*2>::type, PacketType>::value
+    ));
+    STATIC_CHECK((
+      internal::is_same<typename internal::find_best_packet<Scalar, PacketSize*5>::type, PacketType>::value
+    ));
+    // Moreover, sizes that are _not_ a multiple of the packet size, but for which the full packet
+    // is still convenient, also pick it -- checked only if EIGEN_UNALIGNED_VECTORIZE or PacketSize == HalfPacketSize
+    STATIC_CHECK((
+      !(EIGEN_UNALIGNED_VECTORIZE || PacketSize == HalfPacketSize) ||
+      internal::is_same<typename internal::find_best_packet<Scalar, PacketSize*5+1>::type, PacketType>::value
+    ));
+    STATIC_CHECK((
+      !(EIGEN_UNALIGNED_VECTORIZE || PacketSize == HalfPacketSize) ||
+      internal::is_same<typename internal::find_best_packet<Scalar, PacketSize*5+2>::type, PacketType>::value
+    ));
+    // In situations where picking the full packet would be detrimental, the half packet
+    // is chosen.
+    STATIC_CHECK((
+      !(PacketSize > 2) ||
+      internal::is_same<typename internal::find_best_packet<Scalar, PacketSize*2-1>::type, HalfPacketType>::value
+    ));
   }
+
 };
 
 template<typename Scalar> struct vectorization_logic<Scalar,false>
commit	eb85b97339e3791d533592bac20999b1b3ebca09	[log] [tgz]
author	Francesco Mazzoli <f@mazzo.li>	Mon Nov 29 21:13:24 2021 +0000
committer	Rasmus Munk Larsen <rmlarsen@google.com>	Mon Nov 29 21:13:24 2021 +0000
tree	12cbf8de9fe0d5e2560c38be3c9025c667b0712d
parent	eef33946b79663a9e9aec41c14579f9ae581b389 [diff] [blame]