mirror of
https://github.com/paboyle/Grid.git
synced 2024-11-14 01:35:36 +00:00
dc814f30da
Number of IO MPI tasks can be varied by selecting which dimensions use parallel IO and which dimensions use Serial send to boss I/O. Thus can neck down from, say 1024 nodes = 4x4x8x8 to {1,8,32,64,128,256,1024} nodes doing the I/O. Interpolates nicely between ALL nodes write their data, a single boss per time-plane in processor space [old UKQCD fortran code did this], and a single node doing all I/O. Not sure I have the transfer sizes big enough and am not overly convinced fstream is guaranteed to not give buffer inconsistencies unless I set streambuf size to zero. Practically it has worked on 8 tasks, 2x1x2x2 writing /cloning NERSC configurations on my MacOS + OpenMPI and Clang environment. It is VERY easy to switch to pwrite at a later date, and also easy to send x-strips around from each node in order to gather bigger chunks at the syscall level. That would push us up to the circa 8x 18*4*8 == 4KB size write chunk, and by taking, say, x/y non parallel we get to 16MB contiguous chunks written in multi 4KB transactions per IOnode in 64^3 lattices for configuration I/O. I suspect this is fine for system performance.
102 lines
4.3 KiB
C++
102 lines
4.3 KiB
C++
#include <Grid.h>
|
|
|
|
using namespace std;
|
|
using namespace Grid;
|
|
using namespace Grid::QCD;
|
|
|
|
int main (int argc, char ** argv)
|
|
{
|
|
Grid_init(&argc,&argv);
|
|
|
|
const int Ls=8;
|
|
|
|
GridCartesian * UGrid = SpaceTimeGrid::makeFourDimGrid(GridDefaultLatt(), GridDefaultSimd(Nd,vComplex::Nsimd()),GridDefaultMpi());
|
|
GridRedBlackCartesian * UrbGrid = SpaceTimeGrid::makeFourDimRedBlackGrid(UGrid);
|
|
|
|
GridCartesian * FGrid = SpaceTimeGrid::makeFiveDimGrid(Ls,UGrid);
|
|
GridRedBlackCartesian * FrbGrid = SpaceTimeGrid::makeFiveDimRedBlackGrid(Ls,UGrid);
|
|
|
|
///////////////////////////////////////////////////
|
|
// Construct a coarsened grid; utility for this?
|
|
///////////////////////////////////////////////////
|
|
std::vector<int> clatt = GridDefaultLatt();
|
|
for(int d=0;d<clatt.size();d++){
|
|
clatt[d] = clatt[d]/2;
|
|
}
|
|
GridCartesian *Coarse4d = SpaceTimeGrid::makeFourDimGrid(clatt, GridDefaultSimd(Nd,vComplex::Nsimd()),GridDefaultMpi());;
|
|
GridCartesian *Coarse5d = SpaceTimeGrid::makeFiveDimGrid(1,Coarse4d);
|
|
|
|
std::vector<int> seeds4({1,2,3,4});
|
|
std::vector<int> seeds5({5,6,7,8});
|
|
std::vector<int> cseeds({5,6,7,8});
|
|
GridParallelRNG RNG5(FGrid); RNG5.SeedFixedIntegers(seeds5);
|
|
GridParallelRNG RNG4(UGrid); RNG4.SeedFixedIntegers(seeds4);
|
|
GridParallelRNG CRNG(Coarse5d);CRNG.SeedFixedIntegers(cseeds);
|
|
|
|
LatticeFermion src(FGrid); gaussian(RNG5,src);
|
|
LatticeFermion result(FGrid); result=zero;
|
|
LatticeFermion ref(FGrid); ref=zero;
|
|
LatticeFermion tmp(FGrid);
|
|
LatticeFermion err(FGrid);
|
|
LatticeGaugeField Umu(UGrid);
|
|
|
|
NerscField header;
|
|
std::string file("./ckpoint_lat.400");
|
|
NerscIO::readConfiguration(Umu,header,file);
|
|
|
|
// SU3::ColdConfiguration(RNG4,Umu);
|
|
// SU3::TepidConfiguration(RNG4,Umu);
|
|
// SU3::HotConfiguration(RNG4,Umu);
|
|
// Umu=zero;
|
|
|
|
RealD mass=0.1;
|
|
RealD M5=1.5;
|
|
|
|
std::cout<<GridLogMessage << "**************************************************"<< std::endl;
|
|
std::cout<<GridLogMessage << "Building g5R5 hermitian DWF operator" <<std::endl;
|
|
std::cout<<GridLogMessage << "**************************************************"<< std::endl;
|
|
DomainWallFermionR Ddwf(Umu,*FGrid,*FrbGrid,*UGrid,*UrbGrid,mass,M5);
|
|
Gamma5R5HermitianLinearOperator<DomainWallFermionR,LatticeFermion> HermIndefOp(Ddwf);
|
|
|
|
const int nbasis = 8;
|
|
|
|
typedef Aggregation<vSpinColourVector,vTComplex,nbasis> Subspace;
|
|
typedef CoarsenedMatrix<vSpinColourVector,vTComplex,nbasis> LittleDiracOperator;
|
|
typedef LittleDiracOperator::CoarseVector CoarseVector;
|
|
|
|
std::cout<<GridLogMessage << "**************************************************"<< std::endl;
|
|
std::cout<<GridLogMessage << "Calling Aggregation class to build subspace" <<std::endl;
|
|
std::cout<<GridLogMessage << "**************************************************"<< std::endl;
|
|
MdagMLinearOperator<DomainWallFermionR,LatticeFermion> HermDefOp(Ddwf);
|
|
Subspace Aggregates(Coarse5d,FGrid);
|
|
Aggregates.CreateSubspace(RNG5,HermDefOp);
|
|
|
|
|
|
LittleDiracOperator LittleDiracOp(*Coarse5d);
|
|
LittleDiracOp.CoarsenOperator(FGrid,HermIndefOp,Aggregates);
|
|
|
|
CoarseVector c_src (Coarse5d);
|
|
CoarseVector c_res (Coarse5d);
|
|
gaussian(CRNG,c_src);
|
|
c_res=zero;
|
|
|
|
std::cout<<GridLogMessage << "**************************************************"<< std::endl;
|
|
std::cout<<GridLogMessage << "Solving mdagm-CG on coarse space "<< std::endl;
|
|
std::cout<<GridLogMessage << "**************************************************"<< std::endl;
|
|
MdagMLinearOperator<LittleDiracOperator,CoarseVector> PosdefLdop(LittleDiracOp);
|
|
ConjugateGradient<CoarseVector> CG(1.0e-6,10000);
|
|
CG(PosdefLdop,c_src,c_res);
|
|
|
|
std::cout<<GridLogMessage << "**************************************************"<< std::endl;
|
|
std::cout<<GridLogMessage << "Solving indef-MCR on coarse space "<< std::endl;
|
|
std::cout<<GridLogMessage << "**************************************************"<< std::endl;
|
|
HermitianLinearOperator<LittleDiracOperator,CoarseVector> HermIndefLdop(LittleDiracOp);
|
|
ConjugateResidual<CoarseVector> MCR(1.0e-6,10000);
|
|
MCR(HermIndefLdop,c_src,c_res);
|
|
|
|
std::cout<<GridLogMessage << "**************************************************"<< std::endl;
|
|
std::cout<<GridLogMessage << "Done "<< std::endl;
|
|
std::cout<<GridLogMessage << "**************************************************"<< std::endl;
|
|
Grid_finalize();
|
|
}
|