Control scalar execution or vector under generic. Disable Eigen vectorisation on powerpc / SUmmit

2025-07-25 08:57:08 +01:00 · 2018-04-12 12:32:57 -04:00
parent 6411caad67
commit a8a0bb85cc
3 changed files with 46 additions and 2 deletions
--- a/configure.ac
+++ b/configure.ac
@@ -234,6 +234,20 @@ AC_ARG_ENABLE([gen-simd-width],
            [ac_gen_simd_width=$enable_gen_simd_width],
            [ac_gen_simd_width=32])

+AC_ARG_ENABLE([gen-scalar],
+            [AS_HELP_STRING([--enable-gen-scalar=yes|no],
+            [enable generic scalar implementation])],
+            [ac_gen_scalar=$enable_gen_scalar],
+            [ac_gen_scalar=no])
+
+case ${ac_gen_scalar} in
+  yes)
+    AC_DEFINE([GENERIC_SCALAR],[1],[Use scalar data parallel loops])
+  ;;
+  *)
+  ;;
+esac
+
 ##################### Compiler dependent choices
 case ${CXX} in 
  nvcc) 
--- a/lib/simd/Grid_generic_types.h
+++ b/lib/simd/Grid_generic_types.h
@@ -29,9 +29,10 @@ Author: Antonin Portelli <antonin.portelli@me.com>

 static_assert(GEN_SIMD_WIDTH % 16u == 0, "SIMD vector size is not an integer multiple of 16 bytes");

-//#define VECTOR_LOOPS
+#undef VECTOR_LOOPS

 // playing with compiler pragmas
+
 #ifdef VECTOR_LOOPS
 #ifdef __clang__
 #define VECTOR_FOR(i, w, inc)						\
@@ -53,6 +54,31 @@ static_assert(GEN_SIMD_WIDTH % 16u == 0, "SIMD vector size is not an integer mul
 NAMESPACE_BEGIN(Grid);
 NAMESPACE_BEGIN(Optimization);

+#ifdef GENERIC_SCALAR
+
+// type traits giving the number of elements for each vector type
+template <typename T> struct W;
+template <> struct W<double> {
+  constexpr static unsigned int c = 1;
+  constexpr static unsigned int r = 2;
+};
+template <> struct W<float> {
+  constexpr static unsigned int c = 1;
+  constexpr static unsigned int r = 2;
+};
+template <> struct W<Integer> {
+  constexpr static unsigned int r = 1;
+};
+template <> struct W<uint16_t> {
+  constexpr static unsigned int c = 1;
+  constexpr static unsigned int r = 2;
+};
+// SIMD vector types
+template <typename T>
+struct vec {
+  T v[W<T>::r];
+};
+#else 
 // type traits giving the number of elements for each vector type
 template <typename T> struct W;
 template <> struct W<double> {
@@ -70,12 +96,12 @@ template <> struct W<uint16_t> {
  constexpr static unsigned int c = GEN_SIMD_WIDTH/4u;
  constexpr static unsigned int r = GEN_SIMD_WIDTH/2u;
 };
-  
 // SIMD vector types
 template <typename T>
 struct vec {
  alignas(GEN_SIMD_WIDTH) T v[W<T>::r];
 };
+#endif

 typedef vec<float>     vecf;
 typedef vec<double>    vecd;
--- a/lib/simd/Grid_vector_types.h
+++ b/lib/simd/Grid_vector_types.h
@@ -138,6 +138,7 @@ public:
  Vector_type v;

  static accelerator_inline constexpr int Nsimd(void) {
+    static_assert( (sizeof(Vector_type) / sizeof(Scalar_type) >= 1), " size mismatch " );
    return sizeof(Vector_type) / sizeof(Scalar_type);
  }

@@ -831,13 +832,16 @@ accelerator_inline void precisionChange(vComplexD *out,vComplexH *in,int nvec){
 accelerator_inline void precisionChange(vComplexF *out,vComplexH *in,int nvec){ precisionChange((vRealF *)out,(vRealH *)in,nvec);}

 // Check our vector types are of an appropriate size.
+
 #if defined QPX
 static_assert(2*sizeof(SIMD_Ftype) == sizeof(SIMD_Dtype), "SIMD vector lengths incorrect");
 static_assert(2*sizeof(SIMD_Ftype) == sizeof(SIMD_Itype), "SIMD vector lengths incorrect");
 #else
+#ifndef GENERIC_SCALAR
 static_assert(sizeof(SIMD_Ftype) == sizeof(SIMD_Dtype), "SIMD vector lengths incorrect");
 static_assert(sizeof(SIMD_Ftype) == sizeof(SIMD_Itype), "SIMD vector lengths incorrect");
 #endif
+#endif

 /////////////////////////////////////////
 // Some traits to recognise the types