diff --git a/benchmarks/Benchmark_usqcd.cc b/benchmarks/Benchmark_usqcd.cc index eaa78e40..3b729b9e 100644 --- a/benchmarks/Benchmark_usqcd.cc +++ b/benchmarks/Benchmark_usqcd.cc @@ -219,7 +219,7 @@ public: uint64_t NN; - uint64_t lmax=32; + uint64_t lmax=40; #define NLOOP (1000*lmax*lmax*lmax*lmax/lat/lat/lat/lat) GridSerialRNG sRNG; sRNG.SeedFixedIntegers(std::vector({45,12,81,9})); @@ -454,11 +454,17 @@ public: pickCheckerboard(Even,src_e,src); pickCheckerboard(Odd,src_o,src); - const int num_cases = 1; +#ifdef AVX512 + const int num_cases = 3; +#else + const int num_cases = 2; +#endif std::string fmt("G/S/C ; G/O/C ; G/S/S ; G/O/S "); controls Cases [] = { - { WilsonKernelsStatic::OptGeneric , WilsonKernelsStatic::CommsAndCompute ,CartesianCommunicator::CommunicatorPolicyConcurrent } + { WilsonKernelsStatic::OptGeneric , WilsonKernelsStatic::CommsAndCompute ,CartesianCommunicator::CommunicatorPolicyConcurrent }, + { WilsonKernelsStatic::OptHandUnroll, WilsonKernelsStatic::CommsAndCompute ,CartesianCommunicator::CommunicatorPolicyConcurrent }, + { WilsonKernelsStatic::OptInlineAsm , WilsonKernelsStatic::CommsAndCompute ,CartesianCommunicator::CommunicatorPolicyConcurrent } }; for(int c=0;c({8,2,2,2}); -#else LebesgueOrder::Block = std::vector({2,2,2,2}); -#endif + Benchmark::Decomposition(); int do_su4=0; @@ -910,7 +919,7 @@ int main (int argc, char ** argv) } if ( do_blas ) { -#if defined(GRID_CUDA) || defined(GRID_HIP) +#if defined(GRID_CUDA) || defined(GRID_HIP) || defined(GRID_SYCL) std::cout<