// Test driver (the header below names it ./tests/Test_stencil.cc). It compares data gathered
// through a Stencil object against the result of Cshift for the same direction/displacement.
//
// Flow that can be read from the text below:
//   1. Grid_init(&argc,&argv); build GridCartesian `Fine` and GridRedBlackCartesian `rbFine`
//      from it; seed a GridParallelRNG through SeedFixedIntegers(seeds) with seeds({1,2,3,4});
//      fill Foo with random(...) and Bar with gaussian(...).
//   2. Full-lattice pass: myStencil.HaloExchange(Foo,compress), then Bar = Cshift(Foo,dir,disp).
//      Each entry of Check is filled from the StencilEntry returned by GetEntry(permute_type,0,i):
//        - _is_local && _permute : permute(check[i], foo[SE->_offset], permute_type)
//        - _is_local only        : check[i] = foo[SE->_offset]
//        - otherwise             : check[i] = myStencil.CommBuf()[SE->_offset]
//      The existing inline comment flags that last read as illegal on most GPU setups.
//   3. Checkerboarded pass: EStencil and OStencil are built on rbFine with Even and Odd.
//      The Checkerboard() labels of ECheck/OCheck are assigned depending on (disp & 0x1).
//      EStencil results are written to ocheck and OStencil results to echeck, then both are
//      merged into Check with setCheckerboard and Diff = Check-Bar is formed.
//   4. A comparison against 1.0e-4 guards exit(-1); Grid_finalize() ends the program.
//
// NOTE(review): this copy looks damaged. Text that would sit between angle brackets
// (the #include target, template arguments, parts of loop conditions and of the stream
// output) is absent, and the file is collapsed onto three physical lines, so every `//`
// comment swallows the remainder of its line. It is not expected to compile as written;
// restore it from the upstream repository before building. The quantity compared with
// 1.0e-4 is among the lost text -- presumably the norm of Diff, TODO confirm.
/************************************************************************************* Grid physics library, www.github.com/paboyle/Grid Source file: ./tests/Test_stencil.cc Copyright (C) 2015 Author: Peter Boyle Author: Peter Boyle Author: paboyle This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 2 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program; if not, write to the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. See the full license in the file "LICENSE" in the top level distribution directory *************************************************************************************/ /* END LEGAL */ #include using namespace std; using namespace Grid; ; int main(int argc, char ** argv) { Grid_init(&argc, &argv); // typedef LatticeColourMatrix Field; typedef LatticeComplex Field; typedef typename Field::vector_object vobj; typedef typename vobj::scalar_object sobj; auto latt_size = GridDefaultLatt(); auto simd_layout = GridDefaultSimd(Nd,vComplex::Nsimd()); auto mpi_layout = GridDefaultMpi(); double volume = latt_size[0]*latt_size[1]*latt_size[2]*latt_size[3]; GridCartesian Fine(latt_size,simd_layout,mpi_layout); GridRedBlackCartesian rbFine(&Fine); GridParallelRNG fRNG(&Fine); // fRNG.SeedFixedIntegers(std::vector({45,12,81,9}); std::vector seeds({1,2,3,4}); fRNG.SeedFixedIntegers(seeds); Field Foo(&Fine); Field Bar(&Fine); Field Check(&Fine); Field Diff(&Fine); LatticeComplex lex(&Fine); lex = Zero(); random(fRNG,Foo); gaussian(fRNG,Bar); for (int i=0;i 
// NOTE(review): the text joining the truncated "for (int i=0;i" above to
// "directions(npoint,dir);" below is missing from this copy (including whatever declares
// dir, disp, npoint and the Stencil type used below) -- recover it from upstream.
directions(npoint,dir); std::vector displacements(npoint,disp); Stencil myStencil(&Fine,npoint,0,directions,displacements,0); Coordinate ocoor(4); for(int o=0;o compress; myStencil.HaloExchange(Foo,compress); Bar = Cshift(Foo,dir,disp); // Implement a stencil code that should agree with cshift! for(int i=0;ioSites();i++){ int permute_type; StencilEntry *SE; SE = myStencil.GetEntry(permute_type,0,i); autoView( check , Check, CpuWrite); autoView( foo , Foo, CpuRead); if ( SE->_is_local && SE->_permute ) permute(check[i],foo[SE->_offset],permute_type); else if (SE->_is_local) check[i] = foo[SE->_offset]; else { check[i] = myStencil.CommBuf()[SE->_offset]; // <-- this is illegal on most GPU setups, host accesses cudaMalloc memory // std::cout << " receive "< 0){ std::cout <<"Coor (" << coor[0]<<","< 1.0e-4) { autoView( check , Check, CpuRead); autoView( bar , Bar, CpuRead); for(int i=0;i 1.0e-4) exit(-1); } } std::cout< directions(npoint,dir); std::vector displacements(npoint,disp); Stencil EStencil(&rbFine,npoint,Even,directions,displacements,0); Stencil OStencil(&rbFine,npoint,Odd,directions,displacements,0); Coordinate ocoor(4); for(int o=0;o compress; Bar = Cshift(Foo,dir,disp); if ( disp & 0x1 ) { ECheck.Checkerboard() = Even; OCheck.Checkerboard() = Odd; } else { ECheck.Checkerboard() = Odd; OCheck.Checkerboard() = Even; } // Implement a stencil code that should agree with that darn cshift! 
// Checkerboarded gather: the EStencil exchange of EFoo feeds ocheck, and the OStencil
// exchange of OFoo feeds echeck, using the same local/permute/CommBuf three-way choice per
// StencilEntry. NOTE(review): the declarations of efoo/ofoo/echeck/ocheck are not present
// in this copy -- presumably autoView(...) lines lost with the other stripped text.
EStencil.HaloExchange(EFoo,compress); for(int i=0;ioSites();i++){ int permute_type; StencilEntry *SE; SE = EStencil.GetEntry(permute_type,0,i); // std::cout << "Even source "<< i<<" -> " <_offset << " "<< SE->_is_local<_is_local && SE->_permute ) permute(ocheck[i],efoo[SE->_offset],permute_type); else if (SE->_is_local) ocheck[i] = efoo[SE->_offset]; else ocheck[i] = EStencil.CommBuf()[SE->_offset]; } OStencil.HaloExchange(OFoo,compress); for(int i=0;ioSites();i++){ int permute_type; StencilEntry *SE; SE = OStencil.GetEntry(permute_type,0,i); // std::cout << "ODD source "<< i<<" -> " <_offset << " "<< SE->_is_local<_is_local && SE->_permute ) permute(echeck[i],ofoo[SE->_offset],permute_type); else if (SE->_is_local) echeck[i] = ofoo[SE->_offset]; else echeck[i] = OStencil.CommBuf()[SE->_offset]; } setCheckerboard(Check,ECheck); setCheckerboard(Check,OCheck); Real nrmC = norm2(Check); Real nrmB = norm2(Bar); Diff = Check-Bar; Real nrm = norm2(Diff); std::cout< 0){ std::cout <<"Coor (" << coor[0]<<","< 1.0e-4) exit(-1); } } Grid_finalize(); }