#include "Grid.h" //DEBUG #include "simd/Grid_vector_types.h" using namespace std; using namespace Grid; using namespace Grid::QCD; /* Grid_main.cc(232): error: no suitable user-defined conversion from "Grid::iScalar, 4>>" to "const Grid::iScalar>>" exists c_m = peekIdiot(scm,1,2); */ template auto peekIdiot(const vobj &rhs,int i,int j) -> decltype(peekIndex<2>(rhs,0,0)) { return peekIndex<2>(rhs,i,j); } template auto peekDumKopf(const vobj &rhs,int i,int j) -> decltype(peekIndex<3>(rhs,0,0)) { return peekIndex<3>(rhs,i,j); } template auto peekDumKopf(const vobj &rhs,int i) -> decltype(peekIndex<3>(rhs,0)) { return peekIndex<3>(rhs,i); } int main (int argc, char ** argv) { Grid_init(&argc,&argv); std::vector latt_size = GridDefaultLatt(); std::vector simd_layout = GridDefaultSimd(4,vComplexF::Nsimd()); std::vector mpi_layout = GridDefaultMpi(); latt_size.resize(4); #ifdef AVX512 for(int omp=128;omp<236;omp+=16){ #else for(int omp=1;omp<8;omp*=20){ #endif #ifdef OMP omp_set_num_threads(omp); #endif for(int lat=8;lat<=16;lat+=40){ latt_size[0] = lat; latt_size[1] = lat; latt_size[2] = lat; latt_size[3] = lat; double volume = latt_size[0]*latt_size[1]*latt_size[2]*latt_size[3]; GridCartesian Fine(latt_size,simd_layout,mpi_layout); GridRedBlackCartesian rbFine(latt_size,simd_layout,mpi_layout); GridParallelRNG FineRNG(&Fine); FineRNG.SeedRandomDevice(); LatticeColourMatrix Foo(&Fine); LatticeColourMatrix Bar(&Fine); LatticeSpinColourMatrix scFoo(&Fine); LatticeSpinColourMatrix scBar(&Fine); LatticeColourMatrix Shifted(&Fine); LatticeColourMatrix ShiftedCheck(&Fine); LatticeColourMatrix rShifted(&rbFine); LatticeColourMatrix bShifted(&rbFine); LatticeColourMatrix rFoo(&rbFine); LatticeColourMatrix bFoo(&rbFine); LatticeColourMatrix FooBar(&Fine); LatticeSpinColourMatrix scFooBar(&Fine); LatticeColourVector cVec(&Fine); LatticeSpinVector sVec(&Fine); LatticeSpinColourVector scVec(&Fine); LatticeColourMatrix cMat(&Fine); LatticeSpinMatrix sMat(&Fine); LatticeSpinColourMatrix scMat(&Fine); LatticeComplex scalar(&Fine); LatticeReal rscalar(&Fine); LatticeReal iscalar(&Fine); SpinMatrix GammaFive; iSpinMatrix iGammaFive; ColourMatrix cmat; random(FineRNG,Foo); gaussian(FineRNG,Bar); random(FineRNG,scFoo); random(FineRNG,scBar); random(FineRNG,cMat); random(FineRNG,sMat); random(FineRNG,scMat); random(FineRNG,cVec); random(FineRNG,sVec); random(FineRNG,scVec); fflush(stdout); cVec = cMat * cVec; // LatticeColourVector = LatticeColourMatrix * LatticeColourVector sVec = sMat * sVec; // LatticeSpinVector = LatticeSpinMatrix * LatticeSpinVector scVec= scMat * scVec;// LatticeSpinColourVector = LatticeSpinColourMatrix * LatticeSpinColourVector scVec= cMat * scVec; // LatticeSpinColourVector = LatticeColourMatrix * LatticeSpinColourVector scVec= sMat * scVec; // LatticeSpinColourVector = LatticeSpinMatrix * LatticeSpinColourVector cMat = outerProduct(cVec,cVec); scalar = localInnerProduct(cVec,cVec); scalar += scalar; scalar -= scalar; scalar *= scalar; add(scalar,scalar,scalar); sub(scalar,scalar,scalar); mult(scalar,scalar,scalar); mac(scalar,scalar,scalar); scalar = scalar+scalar; scalar = scalar-scalar; scalar = scalar*scalar; scalar=outerProduct(scalar,scalar); scalar=adj(scalar); // rscalar=real(scalar); // iscalar=imag(scalar); // scalar =cmplx(rscalar,iscalar); pokeIndex<1>(cVec,scalar,1); scalar=transpose(scalar); scalar=transposeIndex<1>(scalar); scalar=traceIndex<1>(scalar); scalar=peekIndex<1>(cVec,0); scalar=trace(scalar); scalar=localInnerProduct(cVec,cVec); scalar=localNorm2(cVec); // -=,+=,*=,() // add,+,sub,-,mult,mac,* // adj,conjugate // real,imag // transpose,transposeIndex // trace,traceIndex // peekIndex // innerProduct,outerProduct, // localNorm2 // localInnerProduct scMat = sMat*scMat; // LatticeSpinColourMatrix = LatticeSpinMatrix * LatticeSpinColourMatrix #ifdef SSE4 ///////// Tests the new class Grid_simd std::complex ctest(3.0,2.0); std::complex ctestf(3.0,2.0); MyComplexF TestMe1(1.0); // fills only real part MyComplexD TestMe2(ctest); MyComplexD TestMe3(ctest);// compiler generate conversion of basic types //MyRealF TestMe5(ctest);// Must generate compiler error MyRealD TestRe1(2.0); MyRealF TestRe2(3.0); vone(TestRe2); MyComplexF TestMe6(ctestf); MyComplexF TestMe7(ctestf); MyComplexD TheSum= TestMe2*TestMe3; MyComplexF TheSumF= TestMe6*TestMe7; double dsum[2]; _mm_store_pd(dsum, TheSum.v); for (int i =0; i< 2; i++) printf("%f\n", dsum[i]); MyComplexD TheSumI = timesMinusI(TheSum); MyComplexF TheSumIF = timesMinusI(TheSumF); float fsum[4]; _mm_store_ps(fsum, TheSumF.v); for (int i =0; i< 4; i++) printf("%f\n", fsum[i]); vstore(TheSumI, &ctest); std::complex sum = Reduce(TheSumF); std::cout << ctest<< std::endl; std::cout << sum<< std::endl; #endif /////////////////////// // Non-lattice (const objects) * Lattice ColourMatrix cm; SpinColourMatrix scm; vSpinColourMatrix vscm; Complex cplx(1.0); Integer myint=1; double mydouble=1.0; // vSpinColourMatrix vscm; scMat = cMat*scMat; scm = cm * scm; // SpinColourMatrix = ColourMatrix * SpinColourMatrix scm = scm *cm; // SpinColourMatrix = SpinColourMartix * ColourMatrix scm = GammaFive * scm ; // SpinColourMatrix = SpinMatrix * SpinColourMatrix scm = scm* GammaFive ; // SpinColourMatrix = SpinColourMatrix * SpinMatrix scm = scm*cplx; vscm = vscm*cplx; scMat = scMat*cplx; scm = cplx*scm; vscm = cplx*vscm; scMat = cplx*scMat; scm = myint*scm; vscm = myint*vscm; scMat = scMat*myint; scm = scm*mydouble; vscm = vscm*mydouble; scMat = scMat*mydouble; scMat = mydouble*scMat; cMat = mydouble*cMat; sMat = adj(sMat); // LatticeSpinMatrix adjoint sMat = iGammaFive*sMat; // SpinMatrix * LatticeSpinMatrix sMat = GammaFive*sMat; // SpinMatrix * LatticeSpinMatrix scMat= adj(scMat); cMat= adj(cMat); cm=adj(cm); scm=adj(scm); scm=transpose(scm); scm=transposeIndex<1>(scm); // Foo = Foo+scalar; // LatticeColourMatrix+Scalar // Foo = Foo*scalar; // LatticeColourMatrix*Scalar // Foo = Foo-scalar; // LatticeColourMatrix-Scalar // Foo = scalar*Foo; // Scalar*LatticeColourMatrix // Foo = scalar+Foo; // Scalar+LatticeColourMatrix // Foo = scalar-Foo; // Scalar-LatticeColourMatrix LatticeComplex trscMat(&Fine); trscMat = trace(scMat); // Trace { // Peek-ology and Poke-ology, with a little app-ology TComplex c; ColourMatrix c_m; SpinMatrix s_m; SpinColourMatrix sc_m; s_m = traceIndex<1>(sc_m); // Map to traceColour c_m = traceIndex<2>(sc_m); // map to traceSpin c = traceIndex<2>(s_m); c = traceIndex<1>(c_m); s_m = peekIndex<1>(scm,0,0); c_m = peekIndex<2>(scm,1,2); // c_m = peekSpin(scm,1,2); c_m = peekIdiot(scm,1,2); printf("c. Level %d\n",c_m.TensorLevel); printf("c. Level %d\n",c_m().TensorLevel); printf("c. Level %d\n",c_m()().TensorLevel); c_m()() = scm()(0,0); //ColourComponents of CM <= ColourComponents of SpinColourMatrix scm()(1,1) = cm()(); //ColourComponents of CM <= ColourComponents of SpinColourMatrix c = scm()(1,1)(1,2); scm()(1,1)(2,1) = c; pokeIndex<1> (c_m,c,0,0); } FooBar = Bar; /* { std::vector coor(4); for(int d=0;d<4;d++) coor[d] = 0; peekSite(cmat,Foo,coor); Foo = zero; pokeSite(cmat,Foo,coor); } random(Foo); */ lex_sites(Foo); Integer mm[4]; mm[0]=1; mm[1]=Fine._rdimensions[0]; mm[2]=Fine._ldimensions[0]*Fine._ldimensions[1]; mm[3]=Fine._ldimensions[0]*Fine._ldimensions[1]*Fine._ldimensions[2]; LatticeInteger lex(&Fine); lex=zero; for(int d=0;d<4;d++){ LatticeInteger coor(&Fine); LatticeCoordinate(coor,d); lex = lex + coor*mm[d]; } Bar = zero; Bar = where(lex<10,Foo,Bar); { std::vector coor(4); for(coor[3]=0;coor[3]black rShifted = Cshift(bFoo,dir,shift); // Shift black->red ShiftedCheck=zero; setCheckerboard(ShiftedCheck,bShifted); // Put them all together setCheckerboard(ShiftedCheck,rShifted); // and check the results (later) // Check results std::vector coor(4); for(coor[3]=0;coor[3] diff; std::vector shiftcoor = coor; shiftcoor[dir]=(shiftcoor[dir]+shift+latt_size[dir])%(latt_size[dir]/mpi_layout[dir]); std::vector rl(4); for(int dd=0;dd<4;dd++){ rl[dd] = latt_size[dd]/simd_layout[dd]/mpi_layout[dd]; } int lex = coor[0]%rl[0] + (coor[1]%rl[1])*rl[0] + (coor[2]%rl[2])*rl[0]*rl[1] + (coor[3]%rl[3])*rl[0]*rl[1]*rl[2]; lex += +1000*(coor[0]/rl[0]) +1000*(coor[1]/rl[1])*simd_layout[0] +1000*(coor[2]/rl[2])*simd_layout[0]*simd_layout[1] +1000*(coor[3]/rl[3])*simd_layout[0]*simd_layout[1]*simd_layout[2]; int lex_coor = shiftcoor[0]%rl[0] + (shiftcoor[1]%rl[1])*rl[0] + (shiftcoor[2]%rl[2])*rl[0]*rl[1] + (shiftcoor[3]%rl[3])*rl[0]*rl[1]*rl[2]; lex_coor += +1000*(shiftcoor[0]/rl[0]) +1000*(shiftcoor[1]/rl[1])*simd_layout[0] +1000*(shiftcoor[2]/rl[2])*simd_layout[0]*simd_layout[1] +1000*(shiftcoor[3]/rl[3])*simd_layout[0]*simd_layout[1]*simd_layout[2]; ColourMatrix foo; ColourMatrix bar; ColourMatrix shifted1; ColourMatrix shifted2; ColourMatrix shifted3; ColourMatrix foobar1; ColourMatrix foobar2; ColourMatrix mdiff,amdiff; peekSite(shifted1,Shifted,coor); peekSite(shifted2,Foo,shiftcoor); peekSite(shifted3,ShiftedCheck,coor); peekSite(foo,Foo,coor); mdiff = shifted1-shifted2; amdiff=adj(mdiff); ColourMatrix prod = amdiff*mdiff; Real Ttr=real(trace(prod)); double nn=Ttr; if ( nn > 0 ) cout<<"Shift real trace fail "< 0 ) cout<<"Shift fail (shifted1/shifted2-ref) "< 0 ) cout<<"Shift rb fail (shifted3/shifted2-ref) "<