diff --git a/benchmarks/Benchmark_usqcd.cc b/benchmarks/Benchmark_usqcd.cc index 3b729b9e..9c0f5ab5 100644 --- a/benchmarks/Benchmark_usqcd.cc +++ b/benchmarks/Benchmark_usqcd.cc @@ -261,23 +261,25 @@ public: fprintf(FP,"\n\n"); }; - + template static void BLAS(void) { //int nbasis, int nrhs, int coarseVol int basis[] = { 16,32,64 }; - int rhs[] = { 8,16,32 }; - int vol = 4*4*4*4; + int rhs[] = { 8,12,16 }; + int vol = 8*8*8*8; + int blk = 4*4*4*4; GridBLAS blas; - + + int fpbits = sizeof(CComplex)*4; std::cout<(M,N,K,BATCH); fprintf(FP,"%d, %d, %d, %d, %f\n", M, N, K, BATCH, p); @@ -299,9 +301,9 @@ public: for(int r=0;r<3;r++){ int M=basis[b]; int N=rhs[r]; - int K=vol; + int K=blk; int BATCH=vol; - double p=blas.benchmark(M,N,K,BATCH); + double p=blas.benchmark(M,N,K,BATCH); fprintf(FP,"%d, %d, %d, %d, %f\n", M, N, K, BATCH, p); std::cout<(M,N,K,BATCH); fprintf(FP,"%d, %d, %d, %d, %f\n", M, N, K, BATCH, p); std::cout< L_list({8,12,16,24,32}); @@ -877,6 +880,7 @@ int main (int argc, char ** argv) std::vector staggered; int Ls=1; + if (do_dslash){ std::cout<(); + Benchmark::BLAS(); } if ( do_su4 ) { @@ -941,6 +945,7 @@ int main (int argc, char ** argv) Benchmark::Comms(); } + if(do_dslash){ std::cout<