#include using namespace std; using namespace Grid; using namespace Grid::QCD; int main (int argc, char ** argv) { Grid_init(&argc,&argv); const int Nvec=8; typedef Lattice< iVector< vReal,Nvec> > LatticeVec; int Nloop=1000; std::vector simd_layout = GridDefaultSimd(Nd,vReal::Nsimd()); std::vector mpi_layout = GridDefaultMpi(); int threads = GridThread::GetThreads(); std::cout< latt_size ({lat*mpi_layout[0],lat*mpi_layout[1],lat*mpi_layout[2],lat*mpi_layout[3]}); int vol = latt_size[0]*latt_size[1]*latt_size[2]*latt_size[3]; GridCartesian Grid(latt_size,simd_layout,mpi_layout); //GridParallelRNG pRNG(&Grid); pRNG.SeedRandomDevice(); LatticeVec z(&Grid); //random(pRNG,z); LatticeVec x(&Grid); //random(pRNG,x); LatticeVec y(&Grid); //random(pRNG,y); double a=2.0; double start=usecond(); for(int i=0;i &ret,double a,const Lattice &lhs,const Lattice &rhs){ axpy(z,a,x,y); } double stop=usecond(); double time = (stop-start)/Nloop*1000; double flops=vol*Nvec*2;// mul,add double bytes=3*vol*Nvec*sizeof(Real); std::cout< latt_size ({lat*mpi_layout[0],lat*mpi_layout[1],lat*mpi_layout[2],lat*mpi_layout[3]}); int vol = latt_size[0]*latt_size[1]*latt_size[2]*latt_size[3]; GridCartesian Grid(latt_size,simd_layout,mpi_layout); //GridParallelRNG pRNG(&Grid); pRNG.SeedRandomDevice(); LatticeVec z(&Grid); //random(pRNG,z); LatticeVec x(&Grid); //random(pRNG,x); LatticeVec y(&Grid); //random(pRNG,y); double a=2.0; double start=usecond(); for(int i=0;i latt_size ({lat*mpi_layout[0],lat*mpi_layout[1],lat*mpi_layout[2],lat*mpi_layout[3]}); int vol = latt_size[0]*latt_size[1]*latt_size[2]*latt_size[3]; GridCartesian Grid(latt_size,simd_layout,mpi_layout); //GridParallelRNG pRNG(&Grid); pRNG.SeedRandomDevice(); LatticeVec z(&Grid); //random(pRNG,z); LatticeVec x(&Grid); //random(pRNG,x); LatticeVec y(&Grid); //random(pRNG,y); RealD a=2.0; double start=usecond(); for(int i=0;i latt_size ({lat*mpi_layout[0],lat*mpi_layout[1],lat*mpi_layout[2],lat*mpi_layout[3]}); int vol = latt_size[0]*latt_size[1]*latt_size[2]*latt_size[3]; GridCartesian Grid(latt_size,simd_layout,mpi_layout); //GridParallelRNG pRNG(&Grid); pRNG.SeedRandomDevice(); LatticeVec z(&Grid); //random(pRNG,z); LatticeVec x(&Grid); //random(pRNG,x); LatticeVec y(&Grid); //random(pRNG,y); RealD a=2.0; ComplexD nn; double start=usecond(); for(int i=0;i