#include "Grid.h" #include "Grid_vRealD.h" #include "Grid_vRealF.h" #include "Grid_vComplexD.h" #include "Grid_vComplexF.h" #include "Grid_Cartesian.h" #include "Grid_Lattice.h" using namespace std; using namespace dpo; using namespace dpo::QCD; int main (int argc, char ** argv) { Grid_init(&argc,&argv); std::vector latt_size(4); std::vector simd_layout(4); std::vector mpi_layout(4); mpi_layout[0]=4; mpi_layout[1]=2; mpi_layout[2]=4; mpi_layout[3]=2; #ifdef AVX512 for(int omp=128;omp<236;omp+=16){ #else for(int omp=1;omp<8;omp*=20){ #endif #ifdef OMP omp_set_num_threads(omp); #endif for(int lat=16;lat<=16;lat+=40){ latt_size[0] = lat; latt_size[1] = lat; latt_size[2] = lat; latt_size[3] = lat; double volume = latt_size[0]*latt_size[1]*latt_size[2]*latt_size[3]; #ifdef AVX512 simd_layout[0] = 1; simd_layout[1] = 2; simd_layout[2] = 2; simd_layout[3] = 2; #endif #if defined (AVX1)|| defined (AVX2) simd_layout[0] = 1; simd_layout[1] = 1; simd_layout[2] = 2; simd_layout[3] = 2; #endif #if defined (SSE2) simd_layout[0] = 1; simd_layout[1] = 1; simd_layout[2] = 1; simd_layout[3] = 2; #endif GridCartesian Fine(latt_size,simd_layout,mpi_layout); GridRedBlackCartesian rbFine(latt_size,simd_layout,mpi_layout); LatticeColourMatrix Foo(&Fine); LatticeColourMatrix Bar(&Fine); LatticeSpinColourMatrix scFoo(&Fine); LatticeSpinColourMatrix scBar(&Fine); LatticeColourMatrix Shifted(&Fine); LatticeColourMatrix ShiftedCheck(&Fine); LatticeColourMatrix rShifted(&rbFine); LatticeColourMatrix bShifted(&rbFine); LatticeColourMatrix rFoo(&rbFine); LatticeColourMatrix bFoo(&rbFine); LatticeColourMatrix FooBar(&Fine); LatticeSpinColourMatrix scFooBar(&Fine); LatticeColourVector cVec(&Fine); LatticeSpinVector sVec(&Fine); LatticeSpinColourVector scVec(&Fine); LatticeColourMatrix cMat(&Fine); LatticeSpinMatrix sMat(&Fine); LatticeSpinColourMatrix scMat(&Fine); LatticeComplex scalar(&Fine); SpinMatrix GammaFive; iSpinMatrix iGammaFive; ColourMatrix cmat; random(Foo); gaussian(Bar); random(scFoo); random(scBar); random(cMat); random(sMat); random(scMat); random(cVec); random(sVec); random(scVec); fflush(stdout); cVec = cMat * cVec; // LatticeColourVector = LatticeColourMatrix * LatticeColourVector sVec = sMat * sVec; // LatticeSpinVector = LatticeSpinMatrix * LatticeSpinVector scVec= scMat * scVec;// LatticeSpinColourVector = LatticeSpinColourMatrix * LatticeSpinColourVector scVec= cMat * scVec; // LatticeSpinColourVector = LatticeColourMatrix * LatticeSpinColourVector scVec= sMat * scVec; // LatticeSpinColourVector = LatticeSpinMatrix * LatticeSpinColourVector cMat = outerProduct(cVec,cVec); scalar = localInnerProduct(cVec,cVec); scMat = sMat*scMat; // LatticeSpinColourMatrix = LatticeSpinMatrix * LatticeSpinColourMatrix // Non-lattice (const objects) * Lattice ColourMatrix cm; SpinColourMatrix scm; scMat = cMat*scMat; scm = cm * scm; // SpinColourMatrix = ColourMatrix * SpinColourMatrix scm = scm *cm; // SpinColourMatrix = SpinColourMartix * ColourMatrix scm = GammaFive * scm ; // SpinColourMatrix = SpinMatrix * SpinColourMatrix scm = scm* GammaFive ; // SpinColourMatrix = SpinColourMatrix * SpinMatrix sMat = adj(sMat); // LatticeSpinMatrix adjoint sMat = iGammaFive*sMat; // SpinMatrix * LatticeSpinMatrix sMat = GammaFive*sMat; // SpinMatrix * LatticeSpinMatrix scMat= adj(scMat); cMat= adj(cMat); cm=adj(cm); scm=adj(scm); // Foo = Foo+scalar; // LatticeColourMatrix+Scalar // Foo = Foo*scalar; // LatticeColourMatrix*Scalar // Foo = Foo-scalar; // LatticeColourMatrix-Scalar // Foo = scalar*Foo; // Scalar*LatticeColourMatrix // Foo = scalar+Foo; // Scalar+LatticeColourMatrix // Foo = scalar-Foo; // Scalar-LatticeColourMatrix LatticeComplex trscMat(&Fine); trscMat = trace(scMat); // Trace FooBar = Bar; /* { std::vector coor(4); for(int d=0;d<4;d++) coor[d] = 0; peekSite(cmat,Foo,coor); Foo = zero; pokeSite(cmat,Foo,coor); } random(Foo); */ lex_sites(Foo); //setCheckerboard(ShiftedCheck,rFoo); //setCheckerboard(ShiftedCheck,bFoo); // Lattice SU(3) x SU(3) FooBar = Foo * Bar; // Lattice 12x12 GEMM scFooBar = scFoo * scBar; // Benchmark some simple operations LatticeSU3 * Lattice SU3. double t0,t1,flops; double bytes; int ncall=100; int Nc = dpo::QCD::Nc; flops = ncall*1.0*volume*(8*Nc*Nc*Nc); bytes = ncall*1.0*volume*Nc*Nc *2*3*sizeof(dpo::Real); printf("%f flop and %f bytes\n",flops,bytes/ncall); FooBar = Foo * Bar; t0=usecond(); for(int i=0;iblack std::cout << "Shifting odd parities to even result"<red ShiftedCheck=zero; setCheckerboard(ShiftedCheck,bShifted); // Put them all together setCheckerboard(ShiftedCheck,rShifted); // and check the results (later) // Check results std::vector coor(4); for(coor[3]=0;coor[3] diff; std::vector shiftcoor = coor; shiftcoor[dir]=(shiftcoor[dir]+shift+latt_size[dir])%(latt_size[dir]/mpi_layout[dir]); std::vector rl(4); for(int dd=0;dd<4;dd++){ rl[dd] = latt_size[dd]/simd_layout[dd]/mpi_layout[dd]; } int lex = coor[0]%rl[0] + (coor[1]%rl[1])*rl[0] + (coor[2]%rl[2])*rl[0]*rl[1] + (coor[3]%rl[3])*rl[0]*rl[1]*rl[2]; lex += +1000*(coor[0]/rl[0]) +1000*(coor[1]/rl[1])*simd_layout[0] +1000*(coor[2]/rl[2])*simd_layout[0]*simd_layout[1] +1000*(coor[3]/rl[3])*simd_layout[0]*simd_layout[1]*simd_layout[2]; int lex_coor = shiftcoor[0]%rl[0] + (shiftcoor[1]%rl[1])*rl[0] + (shiftcoor[2]%rl[2])*rl[0]*rl[1] + (shiftcoor[3]%rl[3])*rl[0]*rl[1]*rl[2]; lex_coor += +1000*(shiftcoor[0]/rl[0]) +1000*(shiftcoor[1]/rl[1])*simd_layout[0] +1000*(shiftcoor[2]/rl[2])*simd_layout[0]*simd_layout[1] +1000*(shiftcoor[3]/rl[3])*simd_layout[0]*simd_layout[1]*simd_layout[2]; ColourMatrix foo; ColourMatrix bar; ColourMatrix shifted1; ColourMatrix shifted2; ColourMatrix shifted3; ColourMatrix foobar1; ColourMatrix foobar2; ColourMatrix mdiff,amdiff; peekSite(shifted1,Shifted,coor); peekSite(shifted2,Foo,shiftcoor); peekSite(shifted3,ShiftedCheck,coor); peekSite(foo,Foo,coor); mdiff = shifted1-shifted2; amdiff=adj(mdiff); ColourMatrix prod = amdiff*mdiff; TReal Ttr=real(trace(prod)); double nn=Ttr._internal._internal; if ( nn > 0 ) cout<<"Shift real trace fail "< 0 ) cout<<"Shift fail (shifted1/shifted2-ref) "< 0 ) cout<<"Shift rb fail (shifted3/shifted2-ref) "<