diff --git a/Grid/threads/Accelerator.h b/Grid/threads/Accelerator.h index 7336cfd4..06376131 100644 --- a/Grid/threads/Accelerator.h +++ b/Grid/threads/Accelerator.h @@ -458,7 +458,8 @@ inline void acceleratorCopySynchronise(void) { hipStreamSynchronize(copyStream); // Common on all GPU targets ////////////////////////////////////////////// #if defined(GRID_SYCL) || defined(GRID_CUDA) || defined(GRID_HIP) -#define accelerator_forNB( iter1, num1, nsimd, ... ) accelerator_for2dNB( iter1, num1, iter2, 1, nsimd, {__VA_ARGS__} ); +#define accelerator_forNB( iter1, num1, nsimd, ... ) accelerator_for2dNB( iter1, num1, iter2, 1, nsimd, {__VA_ARGS__} ); accelerator_barrier(dummy); + #define accelerator_for( iter, num, nsimd, ... ) \ accelerator_forNB(iter, num, nsimd, { __VA_ARGS__ } ); \ diff --git a/tests/core/Test_compact_wilson_clover_speedup.cc b/tests/core/Test_compact_wilson_clover_speedup.cc index 7a74ab19..695c8061 100644 --- a/tests/core/Test_compact_wilson_clover_speedup.cc +++ b/tests/core/Test_compact_wilson_clover_speedup.cc @@ -53,7 +53,7 @@ static int readInt(int* argc, char*** argv, std::string&& option, int defaultVal static float readFloat(int* argc, char*** argv, std::string&& option, float defaultValue) { std::string arg; - float ret = defaultValue; + double ret = defaultValue; if(checkPresent(argc, argv, option)) { arg = getContent(argc, argv, option); GridCmdOptionFloat(arg, ret); diff --git a/tests/core/Test_fft_matt.cc b/tests/core/Test_fft_matt.cc deleted file mode 100644 index 0c487852..00000000 --- a/tests/core/Test_fft_matt.cc +++ /dev/null @@ -1,244 +0,0 @@ - /************************************************************************************* - -Gamma::Algebra Gmu [] = { - Gamma::Algebra::GammaX, - Gamma::Algebra::GammaY, - Gamma::Algebra::GammaZ, - Gamma::Algebra::GammaT, - Gamma::Algebra::Gamma5 -}; - -int main (int argc, char ** argv) -{ - Grid_init(&argc,&argv); - - int threads = GridThread::GetThreads(); - std::cout< seeds({1,2,3,4}); - GridSerialRNG sRNG; sRNG.SeedFixedIntegers(seeds); // naughty seeding - GridParallelRNG pRNG(&GRID); - pRNG.SeedFixedIntegers(seeds); - - LatticeGaugeFieldD Umu(&GRID); - SU::ColdConfiguration(pRNG,Umu); // Unit gauge - - //////////////////////////////////////////////////// - // Wilson test - //////////////////////////////////////////////////// - { - LatticeFermionD src(&GRID); gaussian(pRNG,src); - LatticeFermionD src_p(&GRID); - LatticeFermionD tmp(&GRID); - LatticeFermionD ref(&GRID); - LatticeFermionD result(&GRID); - - RealD mass=0.1; - WilsonFermionD Dw(Umu,GRID,RBGRID,mass); - - Dw.M(src,ref); - std::cout << "Norm src "< 1/2 gmu (eip - emip) = i sinp gmu - Kinetic = Kinetic + sin(kmu)*ci*(Gamma(Gmu[mu])*src_p); - - } - - W = mass + sk2; - Kinetic = Kinetic + W * src_p; - - std::cout<<"Momentum space src "<< norm2(src_p)< HermOp(Dw); - ConjugateGradient CG(1.0e-10,10000); - CG(HermOp,src,result); - - //////////////////////////////////////////////////////////////////////// - std::cout << " Taking difference" <::RandomGaugeTransform(pRNG,U_GT,g); // Unit gauge - - LatticeFermionD src(&GRID); - LatticeFermionD tmp(&GRID); - LatticeFermionD ref(&GRID); - LatticeFermionD diff(&GRID); - - // could loop over colors - src=Zero(); - Coordinate point(4,0); // 0,0,0,0 - SpinColourVectorD ferm; - ferm=Zero(); - ferm()(0)(0) = ComplexD(1.0); - pokeSite(ferm,src,point); - - RealD mass=0.1; - WilsonFermionD Dw(U_GT,GRID,RBGRID,mass); - - // Momentum space prop - std::cout << " Solving by FFT and Feynman rules" < HermOp(Dw); - ConjugateGradient CG(1.0e-10,10000); - CG(HermOp,src,result); - - //////////////////////////////////////////////////////////////////////// - std::cout << " Taking difference" <