mirror of
				https://github.com/paboyle/Grid.git
				synced 2025-10-31 03:54:33 +00:00 
			
		
		
		
	
		
			
				
	
	
		
			155 lines
		
	
	
		
			4.0 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			155 lines
		
	
	
		
			4.0 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
| #include "Grid.h"
 | |
| 
 | |
| using namespace std;
 | |
| using namespace Grid;
 | |
| using namespace Grid::QCD;
 | |
| 
 | |
| 
 | |
| int main (int argc, char ** argv)
 | |
| {
 | |
|   Grid_init(&argc,&argv);
 | |
| 
 | |
|   std::vector<int> latt_size  (4);
 | |
|   std::vector<int> simd_layout(4);
 | |
|   std::vector<int> mpi_layout (4);
 | |
| 
 | |
|   int omp=1;
 | |
|   int lat=8;
 | |
| 
 | |
|   mpi_layout[0]=1;
 | |
|   mpi_layout[1]=1;
 | |
|   mpi_layout[2]=1;
 | |
|   mpi_layout[3]=1;
 | |
| 
 | |
|     latt_size[0] = lat;
 | |
|     latt_size[1] = lat;
 | |
|     latt_size[2] = lat;
 | |
|     latt_size[3] = lat;
 | |
|     double volume = latt_size[0]*latt_size[1]*latt_size[2]*latt_size[3];
 | |
|     
 | |
| #ifdef AVX512
 | |
|     simd_layout[0] = 1;
 | |
|     simd_layout[1] = 1;
 | |
|     simd_layout[2] = 2;
 | |
|     simd_layout[3] = 2;
 | |
| #endif
 | |
| #if defined (AVX1)|| defined (AVX2)
 | |
|     simd_layout[0] = 1;
 | |
|     simd_layout[1] = 1;
 | |
|     simd_layout[2] = 1;
 | |
|     simd_layout[3] = 2;
 | |
| #endif
 | |
| #if defined (SSE2)
 | |
|     simd_layout[0] = 1;
 | |
|     simd_layout[1] = 1;
 | |
|     simd_layout[2] = 1;
 | |
|     simd_layout[3] = 2;
 | |
| #endif
 | |
|     
 | |
|     GridCartesian Fine(latt_size,simd_layout,mpi_layout);
 | |
|     GridRedBlackCartesian rbFine(latt_size,simd_layout,mpi_layout);
 | |
|     
 | |
|     LatticeColourMatrix Foo(&Fine);
 | |
|     LatticeColourMatrix Bar(&Fine);
 | |
|     LatticeColourMatrix Check(&Fine);
 | |
|     LatticeColourMatrix Diff(&Fine);
 | |
|     
 | |
|     random(Foo);
 | |
|     gaussian(Bar);
 | |
| 
 | |
| 
 | |
|     for(int dir=0;dir<4;dir++){
 | |
|       for(int disp=0;disp<Fine._rdimensions[dir];disp++){
 | |
| 
 | |
| 	// start to test the Cartesian npoint stencil infrastructure
 | |
| 	int npoint=1;
 | |
| 	std::vector<int> directions(npoint,dir);
 | |
| 	std::vector<int> displacements(npoint,disp);
 | |
| 
 | |
| 	CartesianStencil myStencil(&Fine,npoint,0,directions,displacements);
 | |
| 
 | |
| 	printf("STENCIL: osites %d %d dir %d disp %d\n",Fine.oSites(),(int)myStencil._offsets[0].size(),dir,disp);
 | |
| 	std::vector<int> ocoor(4);
 | |
| 	for(int o=0;o<Fine.oSites();o++){
 | |
| 	  Fine.oCoorFromOindex(ocoor,o);
 | |
| 	  ocoor[dir]=(ocoor[dir]+disp)%Fine._rdimensions[dir];
 | |
| 	  int nbr = Fine.oIndexReduced(ocoor);
 | |
| 	  int stcl= myStencil._offsets[0][o];
 | |
| 	  if(nbr!=stcl){
 | |
| 	    printf("STENCIL: nbr %d stencil._offset %d\n",nbr,stcl);
 | |
| 	  }
 | |
| 	}
 | |
| 	
 | |
| 	printf("allocating %d buffers\n",myStencil._unified_buffer_size);
 | |
| 	fflush(stdout);
 | |
| 	std::vector<vColourMatrix,alignedAllocator<vColourMatrix> >  comm_buf(myStencil._unified_buffer_size);
 | |
| 	printf("calling halo exchange\n");fflush(stdout);
 | |
| 	myStencil.HaloExchange(Foo,comm_buf);
 | |
| 
 | |
| 	Bar = Cshift(Foo,dir,disp);
 | |
| 
 | |
| 	// Implement a stencil code that should agree with cshift!
 | |
| 	for(int i=0;i<Check._grid->oSites();i++){
 | |
| 
 | |
| 	  int offset = myStencil._offsets [0][i];
 | |
| 	  int  local = myStencil._is_local[0][i];
 | |
| 	  int permute_type = myStencil._permute_type[0];
 | |
| 	  int perm =myStencil._permute[0][i];
 | |
| 	  if ( local && perm )
 | |
| 	    permute(Check._odata[i],Foo._odata[offset],permute_type);
 | |
| 	  else if (local)
 | |
| 	    Check._odata[i] = Foo._odata[offset];
 | |
| 	  else 
 | |
| 	    Check._odata[i] = comm_buf[offset];
 | |
| 	  
 | |
| 
 | |
| 	}
 | |
| 
 | |
| 	Real nrmC = norm2(Check);
 | |
| 	Real nrmB = norm2(Bar);
 | |
| 	Real nrm = norm2(Check-Bar);
 | |
| 	printf("N2diff = %le (%le, %le) \n",nrm,nrmC,nrmB);fflush(stdout);
 | |
| 
 | |
| 	Real snrmC =0;
 | |
| 	Real snrmB =0;
 | |
| 	Real snrm  =0;
 | |
| 
 | |
| 	std::vector<int> coor(4);
 | |
| 	for(coor[3]=0;coor[3]<latt_size[3]/mpi_layout[3];coor[3]++){
 | |
| 	for(coor[2]=0;coor[2]<latt_size[2]/mpi_layout[2];coor[2]++){
 | |
| 	for(coor[1]=0;coor[1]<latt_size[1]/mpi_layout[1];coor[1]++){
 | |
| 	for(coor[0]=0;coor[0]<latt_size[0]/mpi_layout[0];coor[0]++){
 | |
| 
 | |
| 	  Complex diff;
 | |
| 	  ColourMatrix check,bar;
 | |
| 	  peekSite(check,Check,coor);
 | |
| 	  peekSite(bar,Bar,coor);
 | |
| 
 | |
| 	  for(int r=0;r<3;r++){
 | |
| 	  for(int c=0;c<3;c++){
 | |
|             diff =check._internal._internal[r][c]-bar._internal._internal[r][c];
 | |
|             double nn=real(conj(diff)*diff);
 | |
|             if ( nn > 0){
 | |
| 	      printf("Coor (%d %d %d %d) \t rc %d%d \t %le %le %le\n",
 | |
| 		     coor[0],coor[1],coor[2],coor[3],r,c,
 | |
| 		     nn,
 | |
| 		     real(check._internal._internal[r][c]),
 | |
| 		     real(bar._internal._internal[r][c])
 | |
| 		     );
 | |
| 	    }
 | |
| 	    snrmC=snrmC+real(conj(check._internal._internal[r][c])*check._internal._internal[r][c]);
 | |
| 	    snrmB=snrmB+real(conj(bar._internal._internal[r][c])*bar._internal._internal[r][c]);
 | |
| 	    snrm=snrm+nn;
 | |
| 	  }}
 | |
| 	 
 | |
| 	}}}}
 | |
| 
 | |
| 	printf("scalar N2diff = %le (%le, %le) \n",snrm,snrmC,snrmB);fflush(stdout);
 | |
| 
 | |
| 
 | |
|       }
 | |
|     }
 | |
| 
 | |
|  Grid_finalize();
 | |
| }
 |