diff --git a/benchmarks/Benchmark_dwf.cc b/benchmarks/Benchmark_dwf.cc index 5cdb9ea1..6d91df0a 100644 --- a/benchmarks/Benchmark_dwf.cc +++ b/benchmarks/Benchmark_dwf.cc @@ -21,10 +21,13 @@ *************************************************************************************/ /* END LEGAL */ #include +#define CUDA_PROFILE +#ifdef CUDA_PROFILE +#include +#endif using namespace std; using namespace Grid; - ; template struct scal { @@ -178,6 +181,7 @@ int main (int argc, char ** argv) DomainWallFermionR Dw(Umu,*FGrid,*FrbGrid,*UGrid,*UrbGrid,mass,M5); int ncall =1000; + if (1) { FGrid->Barrier(); Dw.ZeroCounters(); @@ -320,7 +324,13 @@ int main (int argc, char ** argv) Dw.DhopEO(src_o,r_e,DaggerNo); double t0=usecond(); for(int i=0;iBarrier();