From 3d517bbd2a9866ef341c277b91e09d7dd901d73f Mon Sep 17 00:00:00 2001
From: Peter Boyle
Date: Fri, 22 Dec 2023 18:06:13 -0500
Subject: [PATCH] Synchronise decouple from the launch

Speeds up multileg stencils
---
 Grid/algorithms/multigrid/BatchedBlas.h | 32 +++++++++++--------------
 1 file changed, 14 insertions(+), 18 deletions(-)

diff --git a/Grid/algorithms/multigrid/BatchedBlas.h b/Grid/algorithms/multigrid/BatchedBlas.h
index eca52657..47468ea6 100644
--- a/Grid/algorithms/multigrid/BatchedBlas.h
+++ b/Grid/algorithms/multigrid/BatchedBlas.h
@@ -204,13 +204,12 @@ public:
 }
 }
 #endif
- synchronise();
 RealD t1=usecond();
 RealD flops = 8.0*m*n*k*batchCount;
 RealD bytes = 1.0*sizeof(ComplexD)*(m*k+k*n+m*n)*batchCount;
- std::cout <