mirror of
				https://github.com/paboyle/Grid.git
				synced 2025-10-25 02:04:48 +01:00 
			
		
		
		
	
		
			
				
	
	
		
			1291 lines
		
	
	
		
			47 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			1291 lines
		
	
	
		
			47 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
| /*************************************************************************************
 | |
| 
 | |
|     Grid physics library, www.github.com/paboyle/Grid 
 | |
| 
 | |
|     Source file: ./tests/Test_dwf_hdcr.cc
 | |
| 
 | |
|     Copyright (C) 2015
 | |
| 
 | |
| Author: Peter Boyle <paboyle@ph.ed.ac.uk>
 | |
| 
 | |
|     This program is free software; you can redistribute it and/or modify
 | |
|     it under the terms of the GNU General Public License as published by
 | |
|     the Free Software Foundation; either version 2 of the License, or
 | |
|     (at your option) any later version.
 | |
| 
 | |
|     This program is distributed in the hope that it will be useful,
 | |
|     but WITHOUT ANY WARRANTY; without even the implied warranty of
 | |
|     MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | |
|     GNU General Public License for more details.
 | |
| 
 | |
|     You should have received a copy of the GNU General Public License along
 | |
|     with this program; if not, write to the Free Software Foundation, Inc.,
 | |
|     51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
 | |
| 
 | |
|     See the full license in the file "LICENSE" in the top level distribution directory
 | |
|     *************************************************************************************/
 | |
|     /*  END LEGAL */
 | |
| #include <Grid/Grid.h>
 | |
| #include <Grid/algorithms/iterative/PrecGeneralisedConjugateResidual.h>
 | |
| #include <Grid/algorithms/iterative/PrecGeneralisedConjugateResidualNonHermitian.h>
 | |
| #include <Grid/algorithms/iterative/BiCGSTAB.h>
 | |
| 
 | |
| using namespace std;
 | |
| using namespace Grid;
 | |
| 
 | |
| // TODO
 | |
| //
 | |
| // Coarse Grid axpby_ssp_pminus // Inherit from spProj5pm
 | |
| // Coarse Grid axpby_ssp_pplus
 | |
| 
 | |
| template<class Field,class Coeff_t>
 | |
| class CayleyBase : public SparseMatrixBase<Field> 
 | |
| {
 | |
| public:
 | |
|   int Ls;
 | |
|   //    protected:
 | |
|   RealD mass;
 | |
|   RealD M5;
 | |
|   // Save arguments to SetCoefficientsInternal
 | |
|   Vector<Coeff_t> _gamma;
 | |
|   RealD                _zolo_hi;
 | |
|   RealD                _b;
 | |
|   RealD                _c;
 | |
| 
 | |
|   // Cayley form Moebius (tanh and zolotarev)
 | |
|   Vector<Coeff_t> omega;
 | |
|   Vector<Coeff_t> bs;    // S dependent coeffs
 | |
|   Vector<Coeff_t> cs;
 | |
|   Vector<Coeff_t> as;
 | |
|   // For preconditioning Cayley form
 | |
|   Vector<Coeff_t> bee;
 | |
|   Vector<Coeff_t> cee;
 | |
|   Vector<Coeff_t> aee;
 | |
|   Vector<Coeff_t> beo;
 | |
|   Vector<Coeff_t> ceo;
 | |
|   Vector<Coeff_t> aeo;
 | |
|   // LDU factorisation of the eeoo matrix
 | |
|   Vector<Coeff_t> lee;
 | |
|   Vector<Coeff_t> leem;
 | |
|   Vector<Coeff_t> uee;
 | |
|   Vector<Coeff_t> ueem;
 | |
|   Vector<Coeff_t> dee;
 | |
| public:
 | |
|   CayleyBase(RealD _M5, RealD _mass, int _Ls, RealD b_, RealD c_) :
 | |
|     M5(_M5),
 | |
|     mass(_mass),
 | |
|     Ls(_Ls),
 | |
|     _b(b_),
 | |
|     _c(c_)
 | |
|   {
 | |
|     RealD eps = 1.0;
 | |
|     Approx::zolotarev_data *zdata = Approx::higham(eps,this->Ls);// eps is ignored for higham
 | |
|     this->SetCoefficientsTanh(zdata,1.0,0.0);
 | |
|     Approx::zolotarev_free(zdata);
 | |
|   }
 | |
|   /////////////////////////////////////////////////////////
 | |
|   // Replicates functionality
 | |
|   // Use a common base class approach
 | |
|   /////////////////////////////////////////////////////////
 | |
|   // Tanh
 | |
|   void SetCoefficientsTanh(Approx::zolotarev_data *zdata,RealD b,RealD c)
 | |
|   {
 | |
|     Vector<Coeff_t> gamma(this->Ls);
 | |
|     for(int s=0;s<this->Ls;s++) gamma[s] = zdata->gamma[s];
 | |
|     SetCoefficientsInternal(1.0,gamma,b,c);
 | |
|   }
 | |
|   //Zolo
 | |
|   void SetCoefficientsZolotarev(RealD zolo_hi,Approx::zolotarev_data *zdata,RealD b,RealD c)
 | |
|   {
 | |
|     Vector<Coeff_t> gamma(this->Ls);
 | |
|     for(int s=0;s<this->Ls;s++) gamma[s] = zdata->gamma[s];
 | |
|     SetCoefficientsInternal(zolo_hi,gamma,b,c);
 | |
|   }
 | |
|   //Zolo
 | |
|   void SetCoefficientsInternal(RealD zolo_hi,Vector<Coeff_t> & gamma,RealD b,RealD c)
 | |
|   {
 | |
|     int Ls=this->Ls;
 | |
| 
 | |
|     ///////////////////////////////////////////////////////////
 | |
|     // The Cayley coeffs (unprec)
 | |
|     ///////////////////////////////////////////////////////////
 | |
|     assert(gamma.size()==Ls);
 | |
| 
 | |
|     omega.resize(Ls);
 | |
|     bs.resize(Ls);
 | |
|     cs.resize(Ls);
 | |
|     as.resize(Ls);
 | |
|     
 | |
|     double bpc = b+c;
 | |
|     double bmc = b-c;
 | |
|     _b = b;
 | |
|     _c = c;
 | |
|     _gamma  = gamma; // Save the parameters so we can change mass later.
 | |
|     _zolo_hi= zolo_hi;
 | |
|     for(int i=0; i < Ls; i++){
 | |
|       as[i] = 1.0;
 | |
|       omega[i] = _gamma[i]*_zolo_hi; //NB reciprocal relative to Chroma NEF code
 | |
|       assert(omega[i]!=Coeff_t(0.0));
 | |
|       bs[i] = 0.5*(bpc/omega[i] + bmc);
 | |
|       cs[i] = 0.5*(bpc/omega[i] - bmc);
 | |
|     }
 | |
| 
 | |
|     ////////////////////////////////////////////////////////
 | |
|     // Constants for the preconditioned matrix Cayley form
 | |
|     ////////////////////////////////////////////////////////
 | |
|     bee.resize(Ls);
 | |
|     cee.resize(Ls);
 | |
|     beo.resize(Ls);
 | |
|     ceo.resize(Ls);
 | |
|     
 | |
|     for(int i=0;i<Ls;i++){
 | |
|       bee[i]=as[i]*(bs[i]*(4.0-this->M5) +1.0);     
 | |
|       assert(bee[i]!=Coeff_t(0.0));
 | |
|       cee[i]=as[i]*(1.0-cs[i]*(4.0-this->M5));
 | |
|       beo[i]=as[i]*bs[i];
 | |
|       ceo[i]=-as[i]*cs[i];
 | |
|     }
 | |
|     aee.resize(Ls);
 | |
|     aeo.resize(Ls);
 | |
|     for(int i=0;i<Ls;i++){
 | |
|       aee[i]=cee[i];
 | |
|       aeo[i]=ceo[i];
 | |
|     }
 | |
|     
 | |
|     //////////////////////////////////////////
 | |
|     // LDU decomposition of eeoo
 | |
|     //////////////////////////////////////////
 | |
|     dee.resize(Ls);
 | |
|     lee.resize(Ls);
 | |
|     leem.resize(Ls);
 | |
|     uee.resize(Ls);
 | |
|     ueem.resize(Ls);
 | |
|   
 | |
|     for(int i=0;i<Ls;i++){
 | |
|       
 | |
|       dee[i] = bee[i];
 | |
|       
 | |
|       if ( i < Ls-1 ) {
 | |
| 	
 | |
| 	assert(bee[i]!=Coeff_t(0.0));
 | |
| 	assert(bee[0]!=Coeff_t(0.0));
 | |
|       
 | |
| 	lee[i] =-cee[i+1]/bee[i]; // sub-diag entry on the ith column
 | |
|       
 | |
| 	leem[i]=mass*cee[Ls-1]/bee[0];
 | |
| 	for(int j=0;j<i;j++) {
 | |
| 	  assert(bee[j+1]!=Coeff_t(0.0));
 | |
| 	  leem[i]*= aee[j]/bee[j+1];
 | |
| 	}
 | |
|       
 | |
| 	uee[i] =-aee[i]/bee[i];   // up-diag entry on the ith row
 | |
| 	
 | |
| 	ueem[i]=mass;
 | |
| 	for(int j=1;j<=i;j++) ueem[i]*= cee[j]/bee[j];
 | |
| 	ueem[i]*= aee[0]/bee[0];
 | |
|       
 | |
|       } else { 
 | |
| 	lee[i] =0.0;
 | |
| 	leem[i]=0.0;
 | |
| 	uee[i] =0.0;
 | |
| 	ueem[i]=0.0;
 | |
|       }
 | |
|     }
 | |
|     
 | |
|     { 
 | |
|       Coeff_t delta_d=mass*cee[Ls-1];
 | |
|       for(int j=0;j<Ls-1;j++) {
 | |
| 	assert(bee[j] != Coeff_t(0.0));
 | |
| 	delta_d *= cee[j]/bee[j];
 | |
|       }
 | |
|       dee[Ls-1] += delta_d;
 | |
|     }  
 | |
|   };
 | |
| 
 | |
|   //////////////////////////////
 | |
|   // M and Mdag
 | |
|   //////////////////////////////
 | |
|   virtual  void Mdiag    (const Field &in, Field &out) {assert(0);}
 | |
|   virtual  void Mdir     (const Field &in, Field &out,int dir, int disp){assert(0);};
 | |
|   virtual  void MdirAll  (const Field &in, std::vector<Field> &out){assert(0);};
 | |
|   virtual  void DW       (const Field &psi, Field &chi)=0;
 | |
|   virtual  void DWDag    (const Field &psi, Field &chi)=0;
 | |
| 
 | |
|   void M    (const Field &psi, Field &chi)
 | |
|   {
 | |
|     Field Din(psi.Grid());
 | |
|     Meooe5D(psi,Din);
 | |
|     DW(Din,chi);
 | |
|     axpby(chi,1.0,1.0,chi,psi); 
 | |
|     M5D(psi,chi);
 | |
|   }
 | |
|   void Mdag (const Field &psi, Field &chi)
 | |
|   {
 | |
|     Field Din(psi.Grid());
 | |
|     DWDag(psi,Din); 
 | |
|     MeooeDag5D(Din,chi);
 | |
|     M5Ddag(psi,chi);
 | |
|     axpby (chi,1.0,1.0,chi,psi); 
 | |
|   }
 | |
|   /////////////////////////////////
 | |
|   // P and Pdag - might be needed
 | |
|   /////////////////////////////////
 | |
|   void P(const Field &psi, Field &chi)
 | |
|   {
 | |
|     int Ls= this->Ls;
 | |
|     chi=Zero();
 | |
|     for(int s=0;s<Ls;s++){
 | |
|       axpby_ssp_pminus(chi,1.0,chi,1.0,psi,s,s);
 | |
|       axpby_ssp_pplus (chi,1.0,chi,1.0,psi,s,(s+1)%Ls);
 | |
|     }
 | |
|   }
 | |
|   void Pdag(const Field &psi, Field &chi)
 | |
|   {
 | |
|     int Ls= this->Ls;
 | |
|     chi=Zero();
 | |
|     for(int s=0;s<Ls;s++){
 | |
|       axpby_ssp_pminus(chi,1.0,chi,1.0,psi,s,s);
 | |
|       axpby_ssp_pplus (chi,1.0,chi,1.0,psi,s,(s-1+Ls)%Ls);
 | |
|     }
 | |
|   }
 | |
|   ////////////////////////////////////////////////////////
 | |
|   // Depends: Dw, M5D,  M5Ddag, Meooe5D, MeooeDag5D,
 | |
|   ////////////////////////////////////////////////////////
 | |
|   void M5D   (const Field &psi, Field &chi)
 | |
|   {
 | |
|     int Ls=this->Ls;
 | |
|     Vector<Coeff_t> diag (Ls,1.0);
 | |
|     Vector<Coeff_t> upper(Ls,-1.0); upper[Ls-1]=mass;
 | |
|     Vector<Coeff_t> lower(Ls,-1.0); lower[0]   =mass;
 | |
|     M5D(psi,chi,chi,lower,diag,upper);
 | |
|   }
 | |
|   void M5Ddag (const Field &psi, Field &chi)
 | |
|   {
 | |
|     int Ls=this->Ls;
 | |
|     Vector<Coeff_t> diag(Ls,1.0);
 | |
|     Vector<Coeff_t> upper(Ls,-1.0);
 | |
|     Vector<Coeff_t> lower(Ls,-1.0);
 | |
|     upper[Ls-1]=-mass*upper[Ls-1];
 | |
|     lower[0]   =-mass*lower[0];
 | |
|     M5Ddag(psi,chi,chi,lower,diag,upper);
 | |
|   }
 | |
|   void Meooe5D    (const Field &psi, Field &Din)
 | |
|   {
 | |
|     int Ls=this->Ls;
 | |
|     Vector<Coeff_t> diag = bs;
 | |
|     Vector<Coeff_t> upper= cs;
 | |
|     Vector<Coeff_t> lower= cs; 
 | |
|     upper[Ls-1]=-mass*upper[Ls-1];
 | |
|     lower[0]   =-mass*lower[0];
 | |
|     M5D(psi,psi,Din,lower,diag,upper);
 | |
|   }
 | |
|   void MeooeDag5D    (const Field &psi, Field &Din)
 | |
|   {
 | |
|     int Ls=this->Ls;
 | |
|     Vector<Coeff_t> diag =bs;
 | |
|     Vector<Coeff_t> upper=cs;
 | |
|     Vector<Coeff_t> lower=cs; 
 | |
|     
 | |
|     for (int s=0;s<Ls;s++){
 | |
|       if ( s== 0 ) {
 | |
| 	upper[s] = cs[s+1];
 | |
| 	lower[s] =-mass*cs[Ls-1];
 | |
|       } else if ( s==(Ls-1) ) { 
 | |
| 	upper[s] =-mass*cs[0];
 | |
| 	lower[s] = cs[s-1];
 | |
|       } else { 
 | |
| 	upper[s] = cs[s+1];
 | |
| 	lower[s] = cs[s-1];
 | |
|       }
 | |
|       upper[s] = conjugate(upper[s]);
 | |
|       lower[s] = conjugate(lower[s]);
 | |
|       diag[s]  = conjugate(diag[s]);
 | |
|     }
 | |
|     M5Ddag(psi,psi,Din,lower,diag,upper);
 | |
|   }
 | |
| 
 | |
|   void M5D(const Field &psi_i,
 | |
| 	   const Field &phi_i, 
 | |
| 	   Field &chi_i,
 | |
| 	   Vector<Coeff_t> &lower,
 | |
| 	   Vector<Coeff_t> &diag,
 | |
| 	   Vector<Coeff_t> &upper)
 | |
|   {
 | |
|     chi_i.Checkerboard()=psi_i.Checkerboard();
 | |
|     GridBase *grid=psi_i.Grid();
 | |
|     autoView(psi , psi_i,AcceleratorRead);
 | |
|     autoView(phi , phi_i,AcceleratorRead);
 | |
|     autoView(chi , chi_i,AcceleratorWrite);
 | |
|     assert(phi.Checkerboard() == psi.Checkerboard());
 | |
| 
 | |
|     auto pdiag = &diag[0];
 | |
|     auto pupper = &upper[0];
 | |
|     auto plower = &lower[0];
 | |
| 
 | |
|     int Ls =this->Ls;
 | |
|     
 | |
|     // 10 = 3 complex mult + 2 complex add
 | |
|     // Flops = 10.0*(Nc*Ns) *Ls*vol (/2 for red black counting)
 | |
|     uint64_t nloop = grid->oSites()/Ls;
 | |
| 
 | |
|     const int Nsimd = Field::vector_type::Nsimd();
 | |
|     accelerator_for(sss,nloop,Nsimd,{
 | |
| 	uint64_t ss= sss*Ls;
 | |
| 	typedef decltype(coalescedRead(psi[0])) spinor;
 | |
| 	spinor tmp1, tmp2;
 | |
| 	for(int s=0;s<Ls;s++){
 | |
| 	  uint64_t idx_u = ss+((s+1)%Ls);
 | |
| 	  uint64_t idx_l = ss+((s+Ls-1)%Ls);
 | |
| 	  spProj5m(tmp1,psi(idx_u)); // Need routines for this
 | |
| 	  spProj5p(tmp2,psi(idx_l));
 | |
| 	  coalescedWrite(chi[ss+s],pdiag[s]*phi(ss+s)+pupper[s]*tmp1+plower[s]*tmp2);
 | |
| 	}
 | |
|       });
 | |
|   }
 | |
|   void M5Ddag(const Field &psi_i,
 | |
| 	      const Field &phi_i, 
 | |
| 	      Field &chi_i,
 | |
| 	      Vector<Coeff_t> &lower,
 | |
| 	      Vector<Coeff_t> &diag,
 | |
| 	      Vector<Coeff_t> &upper)
 | |
|   {
 | |
|     chi_i.Checkerboard()=psi_i.Checkerboard();
 | |
|     GridBase *grid=psi_i.Grid();
 | |
|     autoView(psi , psi_i,AcceleratorRead);
 | |
|     autoView(phi , phi_i,AcceleratorRead);
 | |
|     autoView(chi , chi_i,AcceleratorWrite);
 | |
|     assert(phi.Checkerboard() == psi.Checkerboard());
 | |
|     
 | |
|     auto pdiag = &diag[0];
 | |
|     auto pupper = &upper[0];
 | |
|     auto plower = &lower[0];
 | |
|     
 | |
|     int Ls=this->Ls;
 | |
|     
 | |
|     uint64_t nloop = grid->oSites()/Ls;
 | |
|     const int Nsimd = Field::vector_type::Nsimd();
 | |
|     accelerator_for(sss,nloop,Nsimd,{
 | |
| 	uint64_t ss=sss*Ls;
 | |
| 	typedef decltype(coalescedRead(psi[0])) spinor;
 | |
| 	spinor tmp1,tmp2;
 | |
| 	for(int s=0;s<Ls;s++){
 | |
| 	  uint64_t idx_u = ss+((s+1)%Ls);
 | |
| 	  uint64_t idx_l = ss+((s+Ls-1)%Ls);
 | |
| 	  spProj5p(tmp1,psi(idx_u));
 | |
| 	  spProj5m(tmp2,psi(idx_l));
 | |
| 	  coalescedWrite(chi[ss+s],pdiag[s]*phi(ss+s)+pupper[s]*tmp1+plower[s]*tmp2);
 | |
| 	}
 | |
|       });
 | |
|   }
 | |
| };
 | |
| 
 | |
| template<class Fobj,class CComplex,int nbasis>
 | |
| class CoarseCayleyFermion  : public CayleyBase< Lattice<iVector<CComplex,nbasis > > , ComplexD >
 | |
| {
 | |
| public:
 | |
|   typedef iVector<CComplex,nbasis >           siteVector;
 | |
|   typedef Lattice<CComplex >                  CoarseComplexField;
 | |
|   typedef Lattice<siteVector>                 CoarseVector;
 | |
|   typedef Lattice<iMatrix<CComplex,nbasis > > CoarseMatrix;
 | |
|   typedef iMatrix<CComplex,nbasis >  Cobj;
 | |
|   typedef Lattice< CComplex >   CoarseScalar; // used for inner products on fine field
 | |
|   typedef Lattice<Fobj >        FineField;
 | |
| 
 | |
|   // Similar to the CoarseOperator but add 5D support.
 | |
|   Geometry  geom;
 | |
|   GridBase *Coarse5D;
 | |
|   GridBase *Coarse4D;
 | |
|   CartesianStencil<siteVector,siteVector,DefaultImplParams> Stencil; 
 | |
|   CoarsenedMatrix<Fobj,CComplex,nbasis> &Dw;
 | |
| 
 | |
|   GridBase * Grid(void)         { return Coarse5D; };   // this is all the linalg routines need to know
 | |
| 
 | |
|   CoarseCayleyFermion(GridCartesian &CoarseGrid4,
 | |
| 		      GridCartesian &CoarseGrid5,
 | |
| 		      CoarsenedMatrix<Fobj,CComplex,nbasis> &_Dw,
 | |
| 		      RealD M5, RealD mass, int Ls, RealD b, RealD c) :
 | |
|     CayleyBase<CoarseVector,ComplexD>(M5,mass,Ls,b,c),
 | |
|     Coarse4D(&CoarseGrid4),
 | |
|     Coarse5D(&CoarseGrid5),
 | |
|     Dw(_Dw),
 | |
|     geom(CoarseGrid5._ndimension),
 | |
|     Stencil( &CoarseGrid5,geom.npoint,Even,geom.directions,geom.displacements,DefaultImplParams())
 | |
|   { 
 | |
|   };
 | |
| 
 | |
| public:
 | |
|   void Project( CoarseVector &C )
 | |
|   {
 | |
|     const int Nsimd = CComplex::Nsimd();
 | |
|     autoView(Cv,C, AcceleratorWrite);
 | |
|     int Ls = this->Ls;
 | |
|     for(int s=0;s<Ls;s++){
 | |
|       accelerator_for(sU, Coarse4D->oSites(), Nsimd, {
 | |
| 	  int sF= sU*Ls+s;
 | |
| 	  auto tmp = coalescedRead(Cv[sF]);
 | |
| 	  coalescedWrite(Cv[sF],tmp);
 | |
|       });
 | |
|     }
 | |
|   }
 | |
|   ////////////////////////////////////////////////
 | |
|   // This is specific to Coarse Grid Cayley
 | |
|   ////////////////////////////////////////////////
 | |
|   virtual  void Mdiag    (const CoarseVector &in, CoarseVector &out)
 | |
|   {
 | |
|     std::vector<CoarseVector> allout(9,in.Grid());
 | |
|     this->MdirAll(in,allout);
 | |
|     out = allout[8];
 | |
|   }
 | |
|   virtual  void Mdir     (const CoarseVector &in, CoarseVector &out,int dir, int disp)
 | |
|   {
 | |
|     assert(0);
 | |
|   }
 | |
|   virtual  void MdirAll  (const CoarseVector &in, std::vector<CoarseVector> &out)
 | |
|   {
 | |
|     conformable(Coarse5D,in.Grid());
 | |
| 
 | |
|     SimpleCompressor<siteVector> compressor;
 | |
| 
 | |
|     Stencil.HaloExchange(in,compressor);
 | |
|     typedef LatticeView<Cobj> Aview;
 | |
|       
 | |
|     const int Nsimd = CComplex::Nsimd();
 | |
|     
 | |
|     // Ls loop for2D
 | |
|     int Ls=this->Ls;
 | |
| 
 | |
|     siteVector *CBp=Stencil.CommBuf();			
 | |
| 
 | |
|     //    int ptype;
 | |
|     //    int nb2=nbasis/2;
 | |
|     
 | |
|     autoView(in_v ,   in, AcceleratorRead);
 | |
|     autoView(st, Stencil, AcceleratorRead);
 | |
|     for(int point=0;point<geom.npoint;point++){
 | |
|       
 | |
|       autoView(out_v,  out[point], AcceleratorWrite);
 | |
|       autoView(Aview,Dw.A[point],AcceleratorRead);
 | |
| 
 | |
|       accelerator_for2d(sF, Coarse5D->oSites(), b, nbasis, Nsimd, {
 | |
| 
 | |
| 	  typedef decltype(coalescedRead(in_v[0])) calcVector;
 | |
| 	  typedef decltype(coalescedRead(in_v[0](0))) calcComplex;
 | |
| 	  int sU = sF/Ls;
 | |
| 	  //	  int  s = sF%Ls;
 | |
| 
 | |
| 	  calcComplex res = Zero();
 | |
| 	  calcVector  nbr;
 | |
| 	  int ptype;
 | |
| 	    
 | |
| 	  StencilEntry *SE=st.GetEntry(ptype,point,sF);
 | |
| 	  
 | |
| 	  if(SE->_is_local) { 
 | |
| 	    nbr = coalescedReadPermute(in_v[SE->_offset],ptype,SE->_permute);
 | |
| 	  } else {
 | |
| 	    nbr = coalescedRead(CBp[SE->_offset]);
 | |
| 	  }
 | |
| 	  acceleratorSynchronise();
 | |
| 
 | |
| 	  for(int bb=0;bb<nbasis;bb++) {
 | |
| 	    res = res + coalescedRead(Aview[sU](b,bb))*nbr(bb);
 | |
| 	  }
 | |
| 	  
 | |
| 	  coalescedWrite(out_v[sF](b),res);
 | |
|       });
 | |
|     }      
 | |
|   }
 | |
|   void DW (const CoarseVector &in, CoarseVector &out)
 | |
|   {
 | |
|     conformable(Coarse5D,in.Grid());
 | |
|     conformable(in.Grid(),out.Grid());
 | |
| 
 | |
|     SimpleCompressor<siteVector> compressor;
 | |
| 
 | |
|     Stencil.HaloExchange(in,compressor);
 | |
|     typedef LatticeView<Cobj> Aview;
 | |
|       
 | |
|     const int Nsimd = CComplex::Nsimd();
 | |
|     
 | |
|     // Ls loop for2D
 | |
|     int Ls=this->Ls;
 | |
| 
 | |
|     Vector<Aview> AcceleratorViewContainer;
 | |
|     for(int p=0;p<geom.npoint;p++) AcceleratorViewContainer.push_back(Dw.A[p].View(AcceleratorRead));
 | |
|     Aview *Aview_p = & AcceleratorViewContainer[0];
 | |
|     autoView(in_v ,   in, AcceleratorRead);
 | |
|     autoView(out_v,  out, AcceleratorWrite);
 | |
|     autoView(st, Stencil, AcceleratorRead);
 | |
|     siteVector *CBp=Stencil.CommBuf();			
 | |
| 
 | |
|     //    int ptype;
 | |
|     //    int nb2=nbasis/2;
 | |
|     accelerator_for2d(sF, Coarse5D->oSites(), b, nbasis, Nsimd, {
 | |
| 
 | |
|       typedef decltype(coalescedRead(in_v[0])) calcVector;
 | |
|       typedef decltype(coalescedRead(in_v[0](0))) calcComplex;
 | |
|       int sU = sF/Ls;
 | |
|       //      int  s = sF%Ls;
 | |
| 
 | |
|       calcComplex res = Zero();
 | |
| 
 | |
|       {
 | |
|       	calcVector  nbr;
 | |
| 	int ptype;
 | |
| 
 | |
| 	for(int point=0;point<geom.npoint;point++){
 | |
| 
 | |
| 	  StencilEntry *SE=st.GetEntry(ptype,point,sF);
 | |
| 	  
 | |
| 	  if(SE->_is_local) { 
 | |
| 	    nbr = coalescedReadPermute(in_v[SE->_offset],ptype,SE->_permute);
 | |
| 	  } else {
 | |
| 	    nbr = coalescedRead(CBp[SE->_offset]);
 | |
| 	  }
 | |
| 	  acceleratorSynchronise();
 | |
| 
 | |
| 	  for(int bb=0;bb<nbasis;bb++) {
 | |
| 	    res = res + coalescedRead(Aview_p[point][sU](b,bb))*nbr(bb);
 | |
| 	  }	  
 | |
| 	}
 | |
|       }
 | |
|       coalescedWrite(out_v[sF](b),res);
 | |
|       });
 | |
|       
 | |
|     for(int p=0;p<geom.npoint;p++) AcceleratorViewContainer[p].ViewClose();
 | |
|   };
 | |
| 
 | |
|   void DWDag (const CoarseVector &in, CoarseVector &out)
 | |
|   {
 | |
|     // Inefficient G5 hermitian use
 | |
|     CoarseVector tmp(Grid());
 | |
|     G5C(tmp, in); //There has to be a better way
 | |
|     DW(tmp, out);
 | |
|     G5C(out, out);
 | |
|   };
 | |
| 
 | |
|   typedef Aggregation<Fobj,CComplex,nbasis> Aggregates;
 | |
| 
 | |
|   void PromoteFromSubspace(Aggregates &_Aggregates,CoarseVector &C,FineField &F) 
 | |
|   {
 | |
|     auto FineGrid4 = _Aggregates.FineGrid;
 | |
|     FineField F4(FineGrid4);
 | |
|     CoarseVector C4(Coarse4D);
 | |
|     for(int s=0;s<this->Ls;s++){
 | |
|       ExtractSlice(C4,C,s,0);
 | |
|       _Aggregates.PromoteFromSubspace(C4,F4); 
 | |
|       InsertSlice(F4,F,s,0);
 | |
|     }      
 | |
|   }
 | |
|   void ProjectToSubspace(Aggregates &_Aggregates,CoarseVector &C,FineField &F) 
 | |
|   {
 | |
|     auto FineGrid4 = _Aggregates.FineGrid;
 | |
|     FineField F4(FineGrid4);
 | |
|     CoarseVector C4(Coarse4D);
 | |
|     for(int s=0;s<this->Ls;s++){
 | |
|       ExtractSlice(F4,F,s,0);
 | |
|       _Aggregates.ProjectToSubspace  (C4,F4);
 | |
|       InsertSlice(C4,C,s,0);
 | |
|     }
 | |
|     Project(C);
 | |
|   }
 | |
|   template<class Ddwf>
 | |
|   void Test(Aggregates &_Aggregates,GridBase *FineGrid, Ddwf &_Ddwf)
 | |
|   {
 | |
|     typedef Lattice<Fobj> FineField;
 | |
|     CoarseVector Cin(Coarse5D);
 | |
|     CoarseVector Cout(Coarse5D);
 | |
|     CoarseVector CFout(Coarse5D);
 | |
| 
 | |
|     FineField Fin(FineGrid);
 | |
|     FineField Fout(FineGrid);
 | |
| 
 | |
| 
 | |
|     std::vector<int> seeds({1,2,3,4,5});
 | |
|     GridParallelRNG RNG(Coarse5D);  RNG.SeedFixedIntegers(seeds);
 | |
| 
 | |
|     gaussian(RNG,Cin);
 | |
|     PromoteFromSubspace(_Aggregates,Cin,Fin);
 | |
|     ProjectToSubspace(_Aggregates,Cin,Fin);
 | |
| 
 | |
|     std::cout << GridLogMessage<< "************  "<<std::endl;
 | |
|     std::cout << GridLogMessage<< " Testing M  "<<std::endl;
 | |
|     std::cout << GridLogMessage<< "************  "<<std::endl;
 | |
|     // Coarse operator
 | |
|     this->M(Cin,Cout);
 | |
|     this->Project(Cout);
 | |
|     std::cout << GridLogMessage<< " Cout  "<<norm2(Cout)<<std::endl;
 | |
| 
 | |
|     // Fine projected operator
 | |
|     PromoteFromSubspace(_Aggregates,Cin,Fin);
 | |
|     _Ddwf.M(Fin,Fout);
 | |
|     ProjectToSubspace(_Aggregates,CFout,Fout);
 | |
|     std::cout << GridLogMessage<< " CFout "<<norm2(CFout)<<std::endl;
 | |
|     CFout = CFout-Cout;
 | |
|     std::cout << GridLogMessage<< " diff  "<<norm2(CFout)<<std::endl;
 | |
| 
 | |
|     std::cout << GridLogMessage<< "************  "<<std::endl;
 | |
|     std::cout << GridLogMessage<< " Testing Mdag  "<<std::endl;
 | |
|     std::cout << GridLogMessage<< "************  "<<std::endl;
 | |
|     // Coarse operator
 | |
|     this->Mdag(Cin,Cout);
 | |
|     this->Project(Cout);
 | |
|     std::cout << GridLogMessage<< " Cout  "<<norm2(Cout)<<std::endl;
 | |
| 
 | |
|     // Fine operator
 | |
|     _Ddwf.Mdag(Fin,Fout);
 | |
|     ProjectToSubspace(_Aggregates,CFout,Fout);
 | |
|     std::cout << GridLogMessage<< " CFout "<<norm2(CFout)<<std::endl;
 | |
|     CFout = CFout-Cout;
 | |
|     std::cout << GridLogMessage<< " diff  "<<norm2(CFout)<<std::endl;
 | |
|  
 | |
|   }
 | |
|   virtual std::vector<int> Directions(void)   { return geom.directions;};
 | |
|   virtual std::vector<int> Displacements(void){ return geom.displacements;};
 | |
| };
 | |
| 
 | |
| 
 | |
| template<class Field> class SolverWrapper : public LinearFunction<Field> {
 | |
| private:
 | |
|   LinearOperatorBase<Field> & _Matrix;
 | |
|   OperatorFunction<Field> & _Solver;
 | |
|   LinearFunction<Field>   & _Guess;
 | |
| public:
 | |
|   using LinearFunction<Field>::operator();
 | |
|   /////////////////////////////////////////////////////
 | |
|   // Wrap the usual normal equations trick
 | |
|   /////////////////////////////////////////////////////
 | |
|   SolverWrapper(LinearOperatorBase<Field> &Matrix,
 | |
| 	      OperatorFunction<Field> &Solver,
 | |
| 	      LinearFunction<Field> &Guess) 
 | |
|    :  _Matrix(Matrix), _Solver(Solver), _Guess(Guess) {}; 
 | |
| 
 | |
|   void operator() (const Field &in, Field &out){
 | |
|  
 | |
|     _Guess(in,out);
 | |
|     _Solver(_Matrix,in,out);  // Mdag M out = Mdag in
 | |
| 
 | |
|   }     
 | |
| };
 | |
| 
 | |
| // Must use a non-hermitian solver
 | |
| template<class Matrix,class Field>
 | |
| class PVdagMLinearOperator : public LinearOperatorBase<Field> {
 | |
|   Matrix &_Mat;
 | |
|   Matrix &_PV;
 | |
| public:
 | |
|   PVdagMLinearOperator(Matrix &Mat,Matrix &PV): _Mat(Mat),_PV(PV){};
 | |
| 
 | |
|   virtual std::vector<int> Directions(void)   { return _Mat.Directions();};
 | |
|   virtual std::vector<int> Displacements(void){ return _Mat.Displacements();};
 | |
| 
 | |
|   void OpDiag (const Field &in, Field &out) {
 | |
|     assert(0);
 | |
|   }
 | |
|   void OpDir  (const Field &in, Field &out,int dir,int disp) {
 | |
|     assert(0);
 | |
|   }
 | |
|   void OpDirAll  (const Field &in, std::vector<Field> &out){
 | |
|     assert(0);
 | |
|   };
 | |
|   void Op     (const Field &in, Field &out){
 | |
|     Field tmp(in.Grid());
 | |
|     _Mat.M(in,tmp);
 | |
|     _PV.Mdag(tmp,out);
 | |
|   }
 | |
|   void AdjOp     (const Field &in, Field &out){
 | |
|     Field tmp(in.Grid());
 | |
|     _PV.M(tmp,out);
 | |
|     _Mat.Mdag(in,tmp);
 | |
|   }
 | |
|   void HermOpAndNorm(const Field &in, Field &out,RealD &n1,RealD &n2){
 | |
|     assert(0);
 | |
|   }
 | |
|   void HermOp(const Field &in, Field &out){
 | |
|     assert(0);
 | |
|   }
 | |
| };
 | |
| 
 | |
| RealD InverseApproximation(RealD x){
 | |
|   return 1.0/x;
 | |
| }
 | |
| 
 | |
| template<class Field,class Matrix> class ChebyshevSmoother : public LinearFunction<Field>
 | |
| {
 | |
| public:
 | |
|   using LinearFunction<Field>::operator();
 | |
|   typedef LinearOperatorBase<Field>                            FineOperator;
 | |
|   Matrix         & _SmootherMatrix;
 | |
|   FineOperator   & _SmootherOperator;
 | |
|   
 | |
|   Chebyshev<Field> Cheby;
 | |
| 
 | |
|   ChebyshevSmoother(RealD _lo,RealD _hi,int _ord, FineOperator &SmootherOperator,Matrix &SmootherMatrix) :
 | |
|     _SmootherOperator(SmootherOperator),
 | |
|     _SmootherMatrix(SmootherMatrix),
 | |
|     Cheby(_lo,_hi,_ord,InverseApproximation)
 | |
|   {};
 | |
| 
 | |
|   void operator() (const Field &in, Field &out) 
 | |
|   {
 | |
|     Field tmp(in.Grid());
 | |
|     MdagMLinearOperator<Matrix,Field>   MdagMOp(_SmootherMatrix); 
 | |
|     _SmootherOperator.AdjOp(in,tmp);
 | |
|     Cheby(MdagMOp,tmp,out);         
 | |
|   }
 | |
| };
 | |
| template<class Fobj,class CComplex,int nbasis, class CoarseSolver>
 | |
| class MGPreconditioner : public LinearFunction< Lattice<Fobj> > {
 | |
| public:
 | |
|   using LinearFunction<Lattice<Fobj> >::operator();
 | |
| 
 | |
|   typedef Aggregation<Fobj,CComplex,nbasis> Aggregates;
 | |
|   typedef typename Aggregation<Fobj,CComplex,nbasis>::CoarseVector CoarseVector;
 | |
|   typedef typename Aggregation<Fobj,CComplex,nbasis>::CoarseMatrix CoarseMatrix;
 | |
|   typedef typename Aggregation<Fobj,CComplex,nbasis>::FineField    FineField;
 | |
|   typedef LinearOperatorBase<FineField>                            FineOperator;
 | |
|   typedef LinearFunction    <FineField>                            FineSmoother;
 | |
|   typedef CoarseCayleyFermion<Fobj,CComplex,nbasis> CoarseOperator;
 | |
|   //  typedef SparseMatrixBase<CoarseVector> CoarseOperator;
 | |
| 
 | |
|   Aggregates     & _Aggregates;
 | |
|   FineOperator   & _FineOperator;
 | |
|   FineSmoother   & _PreSmoother;
 | |
|   FineSmoother   & _PostSmoother;
 | |
|   CoarseOperator & _CoarseOperator;
 | |
|   CoarseSolver   & _CoarseSolve;
 | |
| 
 | |
|   int    level;  void Level(int lv) {level = lv; };
 | |
| 
 | |
|   MGPreconditioner(Aggregates &Agg,
 | |
| 		   FineOperator &Fine,
 | |
| 		   FineSmoother &PreSmoother,
 | |
| 		   FineSmoother &PostSmoother,
 | |
| 		   CoarseOperator &CoarseOperator_,
 | |
| 		   CoarseSolver &CoarseSolve_)
 | |
|     : _Aggregates(Agg),
 | |
|       _FineOperator(Fine),
 | |
|       _PreSmoother(PreSmoother),
 | |
|       _PostSmoother(PostSmoother),
 | |
|       _CoarseOperator(CoarseOperator_),
 | |
|       _CoarseSolve(CoarseSolve_),
 | |
|       level(1)  {  }
 | |
| 
 | |
|   virtual void operator()(const FineField &in, FineField & out) 
 | |
|   {
 | |
|     auto CoarseGrid = _CoarseOperator.Grid();
 | |
|     CoarseVector Csrc(CoarseGrid);
 | |
|     CoarseVector Csol(CoarseGrid);
 | |
|     FineField vec1(in.Grid());
 | |
|     FineField vec2(in.Grid());
 | |
| 
 | |
|     std::cout<<GridLogMessage << "Calling PreSmoother " <<std::endl;
 | |
| 
 | |
|     //    std::cout<<GridLogMessage << "Calling PreSmoother input residual "<<norm2(in) <<std::endl;
 | |
|     double t;
 | |
|     // Fine Smoother
 | |
|     t=-usecond();
 | |
|     _PreSmoother(in,out);
 | |
|     t+=usecond();
 | |
| 
 | |
|     std::cout<<GridLogMessage << "PreSmoother took "<< t/1000.0<< "ms" <<std::endl;
 | |
| 
 | |
|     // Update the residual
 | |
|     _FineOperator.Op(out,vec1);  sub(vec1, in ,vec1);   
 | |
|     //    std::cout<<GridLogMessage <<"Residual-1 now " <<norm2(vec1)<<std::endl;
 | |
| 
 | |
|     // Fine to Coarse 
 | |
|     t=-usecond();
 | |
|     _CoarseOperator.ProjectToSubspace(_Aggregates,Csrc,vec1);
 | |
|     //    _Aggregates.ProjectToSubspace  (Csrc,vec1);
 | |
|     t+=usecond();
 | |
|     std::cout<<GridLogMessage << "Project to coarse took "<< t/1000.0<< "ms" <<std::endl;
 | |
| 
 | |
|     // Coarse correction
 | |
|     t=-usecond();
 | |
|     _CoarseSolve(Csrc,Csol);
 | |
|     //Csol=Zero();
 | |
|     t+=usecond();
 | |
|     std::cout<<GridLogMessage << "Coarse solve took "<< t/1000.0<< "ms" <<std::endl;
 | |
| 
 | |
|     // Coarse to Fine
 | |
|     t=-usecond();  
 | |
|     _CoarseOperator.PromoteFromSubspace(_Aggregates,Csol,vec1);
 | |
|     //    _Aggregates.PromoteFromSubspace(Csol,vec1); 
 | |
|     add(out,out,vec1);
 | |
|     t+=usecond();
 | |
|     std::cout<<GridLogMessage << "Promote to this level took "<< t/1000.0<< "ms" <<std::endl;
 | |
| 
 | |
|     // Residual
 | |
|     _FineOperator.Op(out,vec1);  sub(vec1 ,in , vec1);  
 | |
|     //    std::cout<<GridLogMessage <<"Residual-2 now " <<norm2(vec1)<<std::endl;
 | |
| 
 | |
|     // Fine Smoother
 | |
|     t=-usecond();
 | |
|     _PostSmoother(vec1,vec2);
 | |
|     t+=usecond();
 | |
|     std::cout<<GridLogMessage << "PostSmoother took "<< t/1000.0<< "ms" <<std::endl;
 | |
| 
 | |
|     add( out,out,vec2);
 | |
|     std::cout<<GridLogMessage << "Done " <<std::endl;
 | |
|   }
 | |
| };
 | |
| 
 | |
| template<class Fobj,class CComplex,int nbasis, class CoarseSolver>
 | |
| class HDCRPreconditioner : public LinearFunction< Lattice<Fobj> > {
 | |
| public:
 | |
|   using LinearFunction<Lattice<Fobj> >::operator();
 | |
| 
 | |
|   typedef Aggregation<Fobj,CComplex,nbasis> Aggregates;
 | |
|   typedef typename Aggregation<Fobj,CComplex,nbasis>::CoarseVector CoarseVector;
 | |
|   typedef typename Aggregation<Fobj,CComplex,nbasis>::CoarseMatrix CoarseMatrix;
 | |
|   typedef typename Aggregation<Fobj,CComplex,nbasis>::FineField    FineField;
 | |
|   typedef LinearOperatorBase<FineField>                            FineOperator;
 | |
|   typedef LinearFunction    <FineField>                            FineSmoother;
 | |
|   //typedef CoarseCayleyFermion<Fobj,CComplex,nbasis> CoarseOperator;
 | |
|   typedef SparseMatrixBase<CoarseVector> CoarseOperator;
 | |
| 
 | |
|   Aggregates     & _Aggregates;
 | |
|   FineOperator   & _FineOperator;
 | |
|   FineSmoother   & _PreSmoother;
 | |
|   FineSmoother   & _PostSmoother;
 | |
|   CoarseOperator & _CoarseOperator;
 | |
|   CoarseSolver   & _CoarseSolve;
 | |
| 
 | |
|   int    level;  void Level(int lv) {level = lv; };
 | |
| 
 | |
|   HDCRPreconditioner(Aggregates &Agg,
 | |
| 		   FineOperator &Fine,
 | |
| 		   FineSmoother &PreSmoother,
 | |
| 		   FineSmoother &PostSmoother,
 | |
| 		   CoarseOperator &CoarseOperator_,
 | |
| 		   CoarseSolver &CoarseSolve_)
 | |
|     : _Aggregates(Agg),
 | |
|       _FineOperator(Fine),
 | |
|       _PreSmoother(PreSmoother),
 | |
|       _PostSmoother(PostSmoother),
 | |
|       _CoarseOperator(CoarseOperator_),
 | |
|       _CoarseSolve(CoarseSolve_),
 | |
|       level(1)  {  }
 | |
| 
 | |
|   virtual void operator()(const FineField &in, FineField & out) 
 | |
|   {
 | |
|     auto CoarseGrid = _CoarseOperator.Grid();
 | |
|     CoarseVector Csrc(CoarseGrid);
 | |
|     CoarseVector g5Csrc(CoarseGrid);
 | |
|     CoarseVector Csol(CoarseGrid);
 | |
|     FineField vec1(in.Grid());
 | |
|     FineField vec2(in.Grid());
 | |
| 
 | |
|     std::cout<<GridLogMessage<<"\t\t\t" << "Calling PreSmoother " <<std::endl;
 | |
| 
 | |
|     double t;
 | |
|     // Fine Smoother
 | |
|     t=-usecond();
 | |
|     _PreSmoother(in,out);
 | |
|     t+=usecond();
 | |
| 
 | |
|     std::cout<<GridLogMessage<<"\t\t\t" << "PreSmoother took "<< t/1000.0<< "ms" <<std::endl;
 | |
|     // Update the residual
 | |
|     _FineOperator.Op(out,vec1);  sub(vec1, in ,vec1);   
 | |
| 
 | |
|     // Fine to Coarse 
 | |
|     // Based on a coarsening of G5R5 D
 | |
|     // Solves Ddwf out = in
 | |
|     // Coarse operator is g5R5 Ddwf solves g5R5 Ddwf out = in  
 | |
|     t=-usecond();
 | |
|     G5R5(vec2,vec1);
 | |
|     _Aggregates.ProjectToSubspace  (Csrc,vec2);
 | |
|     t+=usecond();
 | |
|     std::cout<<GridLogMessage<<"\t\t\t" << "Project to coarse took "<< t/1000.0<< "ms" <<std::endl;
 | |
| 
 | |
|     // Coarse correction
 | |
|     t=-usecond();
 | |
|     _CoarseSolve(Csrc,Csol);
 | |
|     t+=usecond();
 | |
|     std::cout<<GridLogMessage<<"\t\t\t" << "Coarse solve took "<< t/1000.0<< "ms" <<std::endl;
 | |
| 
 | |
|     // Coarse to Fine
 | |
|     t=-usecond();  
 | |
|     _Aggregates.PromoteFromSubspace(Csol,vec1); 
 | |
|     add(out,out,vec1);
 | |
|     t+=usecond();
 | |
|     std::cout<<GridLogMessage<<"\t\t\t" << "Promote to this level took "<< t/1000.0<< "ms" <<std::endl;
 | |
| 
 | |
|     // Residual
 | |
|     _FineOperator.Op(out,vec1);  sub(vec1 ,in , vec1);  
 | |
| 
 | |
|     // Fine Smoother
 | |
|     t=-usecond();
 | |
|     _PostSmoother(vec1,vec2);
 | |
|     t+=usecond();
 | |
|     std::cout<<GridLogMessage<<"\t\t\t" << "PostSmoother took "<< t/1000.0<< "ms" <<std::endl;
 | |
| 
 | |
|     add( out,out,vec2);
 | |
|   }
 | |
| };
 | |
| 
 | |
| int main (int argc, char ** argv)
 | |
| {
 | |
|   Grid_init(&argc,&argv);
 | |
| 
 | |
|   const int Ls=24;
 | |
| 
 | |
|   GridCartesian         * UGrid   = SpaceTimeGrid::makeFourDimGrid(GridDefaultLatt(), GridDefaultSimd(Nd,vComplex::Nsimd()),GridDefaultMpi());
 | |
|   GridRedBlackCartesian * UrbGrid = SpaceTimeGrid::makeFourDimRedBlackGrid(UGrid);
 | |
| 
 | |
|   GridCartesian         * FGrid   = SpaceTimeGrid::makeFiveDimGrid(Ls,UGrid);
 | |
|   GridRedBlackCartesian * FrbGrid = SpaceTimeGrid::makeFiveDimRedBlackGrid(Ls,UGrid);
 | |
| 
 | |
|   ///////////////////////////////////////////////////
 | |
|   // Construct a coarsened grid; utility for this?
 | |
|   ///////////////////////////////////////////////////
 | |
|   std::vector<int> block ({2,2,2,2}); // 4,2,2,2 gets worse
 | |
|   std::vector<int> blockc ({1,1,1,1});
 | |
|   const int nbasis= 24;
 | |
|   const int nbasisc= 32; // decrease, not improvement
 | |
| 
 | |
|   auto clatt = GridDefaultLatt();
 | |
|   for(int d=0;d<clatt.size();d++){
 | |
|     clatt[d] = clatt[d]/block[d];
 | |
|   }
 | |
|   auto cclatt = clatt;
 | |
|   for(int d=0;d<clatt.size();d++){
 | |
|     cclatt[d] = clatt[d]/blockc[d];
 | |
|   }
 | |
| 
 | |
|   GridCartesian *Coarse4d =  SpaceTimeGrid::makeFourDimGrid(clatt, GridDefaultSimd(Nd,vComplex::Nsimd()),GridDefaultMpi());;
 | |
|   GridCartesian *Coarse5d =  SpaceTimeGrid::makeFiveDimGrid(Ls,Coarse4d);
 | |
| 
 | |
|   GridCartesian *CoarseCoarse4d =  SpaceTimeGrid::makeFourDimGrid(cclatt, GridDefaultSimd(Nd,vComplex::Nsimd()),GridDefaultMpi());;
 | |
|   GridCartesian *CoarseCoarse5d =  SpaceTimeGrid::makeFiveDimGrid(1,CoarseCoarse4d);
 | |
| 
 | |
|   std::vector<int> seeds({1,2,3,4});
 | |
|   GridParallelRNG          RNG5(FGrid);   RNG5.SeedFixedIntegers(seeds);
 | |
|   GridParallelRNG          RNG4(UGrid);   RNG4.SeedFixedIntegers(seeds);
 | |
|   GridParallelRNG          CRNG(Coarse4d);CRNG.SeedFixedIntegers(seeds);
 | |
| 
 | |
|   LatticeGaugeField Umu(UGrid); 
 | |
| #if 0
 | |
|   SU3::TepidConfiguration(RNG4,Umu);
 | |
|   RealD M5=1.0;
 | |
| #else
 | |
|   std::string file("./ckpoint_lat.1000");
 | |
|   FieldMetaData header;
 | |
|   NerscIO::readConfiguration(Umu,header,file);
 | |
|   RealD M5=1.8;
 | |
| #endif
 | |
| 
 | |
|   std::cout<<GridLogMessage << "**************************************************"<< std::endl;
 | |
|   std::cout<<GridLogMessage << "Building g5R5 hermitian DWF operator" <<std::endl;
 | |
|   std::cout<<GridLogMessage << "**************************************************"<< std::endl;
 | |
| 
 | |
|   RealD mass=0.00078;
 | |
| 
 | |
|   WilsonFermionD     Dw(Umu,*UGrid,*UrbGrid,-M5);
 | |
|   DomainWallFermionD Ddwf(Umu,*FGrid,*FrbGrid,*UGrid,*UrbGrid,mass,M5);
 | |
|   DomainWallFermionD Dpv (Umu,*FGrid,*FrbGrid,*UGrid,*UrbGrid,1.0,M5);
 | |
| 
 | |
|   typedef Aggregation<vSpinColourVector,vTComplex,nbasis>              Subspace;
 | |
|   typedef CoarsenedMatrix<vSpinColourVector,vTComplex,nbasis>          CoarseOperator;
 | |
|   typedef CoarseOperator::CoarseVector                                 CoarseVector;
 | |
|   typedef CoarseOperator::siteVector siteVector;
 | |
| 
 | |
|   std::cout<<GridLogMessage << "**************************************************"<< std::endl;
 | |
|   std::cout<<GridLogMessage << "Calling Aggregation class to build subspace" <<std::endl;
 | |
|   std::cout<<GridLogMessage << "**************************************************"<< std::endl;
 | |
|   // How to find criticall mass?
 | |
|   // WilsonFermionD     Dw_null(Umu,*UGrid,*UrbGrid,-0.75); //   600 iters
 | |
|   // WilsonFermionD     Dw_null(Umu,*UGrid,*UrbGrid,-0.80); //   800 iters
 | |
|   //  WilsonFermionD     Dw_null(Umu,*UGrid,*UrbGrid,-0.82); // 1023 iters
 | |
|   //  WilsonFermionD     Dw_null(Umu,*UGrid,*UrbGrid,-0.85); // 1428 iters
 | |
|   //  WilsonFermionD     Dw_null(Umu,*UGrid,*UrbGrid,-0.87); //  1900 iters
 | |
|   //  WilsonFermionD     Dw_null(Umu,*UGrid,*UrbGrid,-0.90); // 3900   iters
 | |
|   //  WilsonFermionD     Dw_null(Umu,*UGrid,*UrbGrid,-0.92); // 6200   iters
 | |
|   //  WilsonFermionD     Dw_null(Umu,*UGrid,*UrbGrid,-0.94);  // 8882 iters
 | |
|   WilsonFermionD     Dw_null(Umu,*UGrid,*UrbGrid,-0.95);  // 9170  iters
 | |
|   //  WilsonFermionD     Dw_null(Umu,*UGrid,*UrbGrid,-0.96);  // 8882   iters
 | |
|   //  WilsonFermionD     Dw_null(Umu,*UGrid,*UrbGrid,-0.97);  // 8406  iters
 | |
|   //  WilsonFermionD     Dw_null(Umu,*UGrid,*UrbGrid,-0.99); // 6900   iters
 | |
|   //  WilsonFermionD     Dw_null(Umu,*UGrid,*UrbGrid,-1.01); // 6397   iters
 | |
|   //  WilsonFermionD     Dw_null(Umu,*UGrid,*UrbGrid,-1.00); // 5900   iters
 | |
|   MdagMLinearOperator<WilsonFermionD,LatticeFermion> MdagM_Dw(Dw_null);
 | |
| 
 | |
|   std::cout<<GridLogMessage << "**************************************************"<< std::endl;
 | |
|   std::cout<<GridLogMessage << "Testing Wilson criticality " <<std::endl;
 | |
|   std::cout<<GridLogMessage << "**************************************************"<< std::endl;
 | |
|   /*
 | |
|   ConjugateGradient<LatticeFermion>          WilsonCG(1.0e-10,40000);
 | |
|   LatticeFermion w_src(UGrid); w_src=1.0;
 | |
|   LatticeFermion w_res(UGrid);
 | |
|   WilsonCG(MdagM_Dw,w_src,w_res);
 | |
|   exit(0);
 | |
|   */
 | |
|   std::cout<<GridLogMessage << "**************************************************"<< std::endl;
 | |
|   std::cout<<GridLogMessage << " 4D subspace build                                " <<std::endl;
 | |
|   std::cout<<GridLogMessage << "**************************************************"<< std::endl;
 | |
|   Subspace Aggregates4D(Coarse4d,UGrid,0);
 | |
|   assert ( (nbasis & 0x1)==0);
 | |
|   int nb=nbasis/2;
 | |
|   Gamma g5(Gamma::Algebra::Gamma5);
 | |
| 
 | |
|   Aggregates4D.CreateSubspaceChebyshev(RNG4,MdagM_Dw,nb,60.0,3.0,300,150,150,0.0); // now at 26 iter
 | |
|   //  Aggregates4D.CreateSubspaceChebyshev(RNG4,MdagM_Dw,nb,60.0,3.0,300,150,150,0.0); // now at 26 iter
 | |
|   //  Aggregates4D.CreateSubspaceChebyshev(RNG4,MdagM_Dw,nb,60.0,3.0,500,150,150,0.0); // now at 26 iter
 | |
|   //  Aggregates4D.CreateSubspaceChebyshev(RNG4,MdagM_Dw,nb,60.0,4.0,500,150,150,0.0); // now at 26 iter
 | |
|   //  Aggregates4D.CreateSubspaceChebyshev(RNG4,MdagM_Dw,nb,60.0,4.0,500,150,150,0.0); //35
 | |
|   //  Aggregates4D.CreateSubspaceChebyshev(RNG4,MdagM_Dw,nb,60.0,4.0,600,100,250,0.0); //39
 | |
|   //  Aggregates4D.CreateSubspaceChebyshev(RNG4,MdagM_Dw,nb,60.0,4.0,600,250,100,0.0); //39
 | |
|   //  Aggregates4D.CreateSubspaceChebyshev(RNG4,MdagM_Dw,nb,60.0,4.0,600,100,100,0.0); //36
 | |
|   //  Aggregates4D.CreateSubspaceChebyshev(RNG4,MdagM_Dw,nb,60.0,4.0,600,250,100,0.0); //39
 | |
|   //   Aggregates4D.CreateSubspaceChebyshev(RNG4,MdagM_Dw,nb,60.0,4.0,600,250,50,0.0);// 39
 | |
|   //  Aggregates4D.CreateSubspaceChebyshev(RNG4,MdagM_Dw,nb,60.0,4.0,600,250,250,0.0);// 35
 | |
|   //  Aggregates4D.CreateSubspaceChebyshev(RNG4,MdagM_Dw,nb,60.0,4.0,250,250,250,0.0);//  38 iter
 | |
|   //  Aggregates4D.CreateSubspaceChebyshev(RNG4,MdagM_Dw,nb,50.0,4.0,250,250,100,0.0);//  40 iter
 | |
|   //  Aggregates4D.CreateSubspaceChebyshev(RNG4,MdagM_Dw,nb,50.0,4.0,500,100,100,0.0);// 38 iter
 | |
|   //  Aggregates4D.CreateSubspaceChebyshev(RNG4,MdagM_Dw,nb,60.0,4.0,500,100,100,0.0);// 36 iter
 | |
|   //  Aggregates4D.CreateSubspaceChebyshev(RNG4,MdagM_Dw,nb,60.0,3.0,500,100,100,0.0);// 37 iter
 | |
|   //  Aggregates4D.CreateSubspaceChebyshev(RNG4,MdagM_Dw,nb,60.0,1.0,1000,400,400,0.0);// 38 iter
 | |
|   //  Aggregates4D.CreateSubspaceChebyshev(RNG4,MdagM_Dw,nb,60.0,0.5,1000,400,400,0.0);// 39 iter HDCR smooth 14
 | |
|   //  Aggregates4D.CreateSubspaceChebyshev(RNG4,MdagM_Dw,nb,60.0,0.1,1000,400,400,0.0);// 41
 | |
|   for(int n=0;n<nb;n++){
 | |
|     Aggregates4D.subspace[nbasis-1-n]= Aggregates4D.subspace[n] - g5 * Aggregates4D.subspace[n];
 | |
|     Aggregates4D.subspace[n]         = Aggregates4D.subspace[n] + g5 * Aggregates4D.subspace[n];
 | |
|   }
 | |
|   std::cout<<GridLogMessage << "**************************************************"<< std::endl;
 | |
|   std::cout<<GridLogMessage << " Coarsen the Dw operator                          " <<std::endl;
 | |
|   std::cout<<GridLogMessage << "**************************************************"<< std::endl;
 | |
|   typedef CoarsenedMatrix<vSpinColourVector,vTComplex,nbasis>    Level1Op4;
 | |
|   typedef CoarseCayleyFermion<vSpinColourVector,vTComplex,nbasis> Level1Op5;
 | |
|   Level1Op4 c_Dw    (*Coarse4d,0);
 | |
|   NonHermitianLinearOperator<WilsonFermionD,LatticeFermion>  LinOpDw(Dw);
 | |
|   c_Dw.CoarsenOperator(UGrid,LinOpDw,Aggregates4D); // contains the M5 from Dw(-M5)
 | |
|   //  c_Dw.Test(Aggregates4D,UGrid,LinOpDw);
 | |
| 
 | |
|   std::cout<<GridLogMessage << "**************************************************"<< std::endl;
 | |
|   std::cout<<GridLogMessage << " Build coarse DWF operator                          " <<std::endl;
 | |
|   std::cout<<GridLogMessage << "**************************************************"<< std::endl;
 | |
|   Level1Op5 c_Dwf  (*Coarse4d,*Coarse5d,c_Dw,M5, mass, Ls, 1.0,0.0);
 | |
|   //  c_Dwf.Test(Aggregates4D,FGrid,Ddwf);
 | |
| 
 | |
|   MdagMLinearOperator<Level1Op5,CoarseVector> MdagM_cDwf(c_Dwf);
 | |
| 
 | |
|   std::cout<<GridLogMessage << "**************************************************"<< std::endl;
 | |
|   std::cout<<GridLogMessage << "Build 5D coarse deflation space" << std::endl;
 | |
|   std::cout<<GridLogMessage << "**************************************************"<< std::endl;
 | |
|   int nbc=nbasisc/2;
 | |
|   typedef CoarsenedMatrix<siteVector,iScalar<vTComplex>,nbasisc>     Level2Op;
 | |
|   typedef Aggregation<siteVector,iScalar<vTComplex>,nbasisc> CoarseSubspace;
 | |
|   CoarseSubspace CoarseAggregates(CoarseCoarse5d,Coarse5d,0);
 | |
| 
 | |
|   std::cout<<GridLogMessage << "**************************************************"<< std::endl;
 | |
|   std::cout<<GridLogMessage << "Build Chebyshev space in coarse operator "<< std::endl;
 | |
|   std::cout<<GridLogMessage << "**************************************************"<< std::endl;
 | |
|   CoarseAggregates.CreateSubspaceChebyshev(CRNG,MdagM_cDwf,nbc,40.0,0.01,300,150,100,0.0);
 | |
| 
 | |
|   {
 | |
|     std::cout<<GridLogMessage << "**************************************************"<< std::endl;
 | |
|     std::cout<<GridLogMessage << "Applying G5R5 projection of coarse operator "<< std::endl;
 | |
|     std::cout<<GridLogMessage << "**************************************************"<< std::endl;
 | |
|     CoarseVector A(Coarse5d), B(Coarse5d);
 | |
|     for(int n=0;n<nbc;n++){
 | |
|       std::cout << " n " << n << " " << 4.0*norm2(CoarseAggregates.subspace[n])<<std::endl;
 | |
|       G5R5(B,CoarseAggregates.subspace[n]);
 | |
|       A = CoarseAggregates.subspace[n];
 | |
|       CoarseAggregates.subspace[n]    = A+B; // 1+G5R5 // eigen value of G5R5 is +1
 | |
|       CoarseAggregates.subspace[n+nbc]= A-B; // 1-G5R5 // eigen value of G5R5 is -1
 | |
|       std::cout << norm2(CoarseAggregates.subspace[n])<<" "<< norm2(CoarseAggregates.subspace[n+nbc])<<std::endl;
 | |
|       std::cout << norm2(CoarseAggregates.subspace[n])+ norm2(CoarseAggregates.subspace[n+nbc])<<std::endl;
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   Gamma5R5HermitianLinearOperator<Level1Op5,CoarseVector> L1Hdwf(c_Dwf);
 | |
|   GridRedBlackCartesian * CoarseCoarse5dRB = SpaceTimeGrid::makeFiveDimRedBlackGrid(1,CoarseCoarse4d);
 | |
|   Level2Op cc_Dwf  (*CoarseCoarse5d,*CoarseCoarse5dRB,1); // say it is hermitian
 | |
|   cc_Dwf.CoarsenOperator(Coarse5d,L1Hdwf,CoarseAggregates);
 | |
|   //  cc_Dwf.Test(CoarseAggregates,Coarse5d,L1Hdwf);
 | |
| 
 | |
|   typedef Level2Op::CoarseVector CoarseCoarseVector;
 | |
| 
 | |
|   std::cout<<GridLogMessage << "**************************************************"<< std::endl;
 | |
|   std::cout<<GridLogMessage << " Testing fine and coarse solvers " <<std::endl;
 | |
|   std::cout<<GridLogMessage << "**************************************************"<< std::endl;
 | |
| 
 | |
|   RealD tol=1.0e-8;
 | |
|   int MaxIt = 10000;
 | |
| 
 | |
|   CoarseVector c_src(Coarse5d); c_src=1.0;
 | |
|   CoarseVector c_res(Coarse5d);
 | |
| 
 | |
|   LatticeFermion f_src(FGrid); f_src=1.0;
 | |
|   LatticeFermion f_res(FGrid);
 | |
| 
 | |
|   LatticeFermion f_src_e(FrbGrid); f_src_e=1.0;
 | |
|   LatticeFermion f_res_e(FrbGrid);
 | |
| 
 | |
|   CoarseCoarseVector cc_src(CoarseCoarse5d); cc_src=1.0;
 | |
| 
 | |
|   ConjugateGradient<CoarseVector>            CoarseCG(tol,MaxIt);
 | |
|   ConjugateGradient<LatticeFermion>          FineCG(tol,MaxIt);
 | |
|   
 | |
|   NonHermitianLinearOperator<DomainWallFermionD,LatticeFermion> FineM(Ddwf);
 | |
|   MdagMLinearOperator<DomainWallFermionD,LatticeFermion>    FineMdagM(Ddwf);     //  M^\dag M
 | |
| 
 | |
|   NonHermitianLinearOperator<Level1Op5,CoarseVector> CoarseM(c_Dwf);
 | |
|   MdagMLinearOperator<Level1Op5,CoarseVector> CoarseMdagM(c_Dwf);
 | |
| 
 | |
|   NonHermitianLinearOperator<Level2Op,CoarseCoarseVector> CoarseCoarseM(cc_Dwf);
 | |
|   MdagMLinearOperator<Level2Op,CoarseCoarseVector> CoarseCoarseMdagM(cc_Dwf);
 | |
| 
 | |
| 
 | |
|   std::cout<<GridLogMessage << "**************************************************"<< std::endl;
 | |
|   std::cout<<GridLogMessage << " Fine    Hw PowerMethod           "<< std::endl;
 | |
|   LatticeFermion w_src(UGrid); 
 | |
|   w_src=1.0;
 | |
|   PowerMethod<LatticeFermion>       PM;   PM(MdagM_Dw,w_src);
 | |
|   std::cout<<GridLogMessage << " Coarse       PowerMethod           "<< std::endl;
 | |
|   c_src=1.0;
 | |
|   PowerMethod<CoarseVector>        cPM;  cPM(CoarseMdagM,c_src);
 | |
| 
 | |
|   cc_src=1.0;
 | |
|   PowerMethod<CoarseCoarseVector>        ccPM;  ccPM(CoarseCoarseMdagM,cc_src);
 | |
| 
 | |
|   std::cout<<GridLogMessage << "**************************************************"<< std::endl;
 | |
|   std::cout<<GridLogMessage << " Running CoarseCoarse grid Lanczos "<< std::endl;
 | |
|   std::cout<<GridLogMessage << "**************************************************"<< std::endl;
 | |
| 
 | |
|   // 37s, 26 iter
 | |
|   int cNk=128;
 | |
|   int cNm=256;
 | |
|   int cNstop=128;
 | |
|   RealD IRL_lo=0.01;
 | |
|   RealD IRL_hi=16.0;
 | |
|   int IRL_ord=201;
 | |
| 
 | |
|   /*
 | |
|   //  int cNk=100; -- slower 27 iters
 | |
|   int cNk=128; //-- 26 iters, but slower
 | |
|   int cNm=192;
 | |
|   int cNstop=128;
 | |
|   RealD IRL_lo=0.005;
 | |
|   RealD IRL_hi=10.0;
 | |
|   int IRL_ord=101;
 | |
|   */
 | |
| 
 | |
|   MdagMLinearOperator<Level2Op,CoarseCoarseVector> IRLHermOpL2(cc_Dwf);
 | |
|   Chebyshev<CoarseCoarseVector> IRLChebyL2(IRL_lo,IRL_hi,IRL_ord);
 | |
|   FunctionHermOp<CoarseCoarseVector> IRLOpChebyL2(IRLChebyL2,IRLHermOpL2);
 | |
|   PlainHermOp<CoarseCoarseVector> IRLOpL2    (IRLHermOpL2);
 | |
|   ImplicitlyRestartedLanczos<CoarseCoarseVector> IRLL2(IRLOpChebyL2,IRLOpL2,cNstop,cNk,cNm,1.0e-3,20);
 | |
| 
 | |
|   cNm=0;
 | |
|   std::vector<RealD>          eval2(cNm);
 | |
|   std::vector<CoarseCoarseVector>   evec2(cNm,CoarseCoarse5d);
 | |
|   cc_src=1.0;
 | |
|   //  int cNconv;
 | |
|   //  IRLL2.calc(eval2,evec2,cc_src,cNconv);
 | |
| 
 | |
|   ConjugateGradient<CoarseCoarseVector>  CoarseCoarseCG(0.02,10000);
 | |
|   DeflatedGuesser<CoarseCoarseVector> DeflCoarseCoarseGuesser(evec2,eval2);
 | |
|   NormalEquations<CoarseCoarseVector> DeflCoarseCoarseCGNE(cc_Dwf,CoarseCoarseCG,DeflCoarseCoarseGuesser);
 | |
| 
 | |
|   //  ZeroGuesser<CoarseVector> CoarseZeroGuesser;
 | |
|   ZeroGuesser<CoarseCoarseVector>       CoarseCoarseZeroGuesser;
 | |
| 
 | |
|   std::cout<<GridLogMessage << "**************************************************"<< std::endl;
 | |
|   std::cout<<GridLogMessage << "Building 3 level hdcr                             "<< std::endl;
 | |
|   std::cout<<GridLogMessage << "**************************************************"<< std::endl;
 | |
|   NormalEquations<CoarseCoarseVector>   CoarseCoarseCGNE(cc_Dwf,CoarseCoarseCG,CoarseCoarseZeroGuesser);
 | |
|   {
 | |
| typedef HDCRPreconditioner<siteVector,iScalar<vTComplex>,nbasisc,NormalEquations<CoarseCoarseVector> > CoarseMG;
 | |
|   typedef MGPreconditioner<vSpinColourVector,  vTComplex,nbasis, LinearFunction<CoarseVector> >     ThreeLevelMG;
 | |
| 
 | |
|   // MultiGrid preconditioner acting on the coarse space <-> coarsecoarse space
 | |
|   ChebyshevSmoother<CoarseVector,  Level1Op5 >       CoarseSmoother1(0.5,22.0,12,CoarseM,c_Dwf); // 37s, 26 iter
 | |
|   ChebyshevSmoother<CoarseVector,  Level1Op5 >       CoarseSmoother2(0.5,22.0,12,CoarseM,c_Dwf);
 | |
| 
 | |
|   //  ChebyshevSmoother<CoarseVector,  Level1Op5 >       CoarseSmoother1(0.5,22.0,7,CoarseM,c_Dwf); // 38s, 26 iter
 | |
|   //  ChebyshevSmoother<CoarseVector,  Level1Op5 >       CoarseSmoother2(0.5,22.0,7,CoarseM,c_Dwf);
 | |
|   //  ChebyshevSmoother<CoarseVector,  Level1Op5 >       CoarseSmoother1(0.4,22.0,7,CoarseM,c_Dwf); // 41s, 27 iter
 | |
|   //  ChebyshevSmoother<CoarseVector,  Level1Op5 >       CoarseSmoother2(0.4,22.0,7,CoarseM,c_Dwf);
 | |
|   //  ChebyshevSmoother<CoarseVector,  Level1Op5 >       CoarseSmoother1(0.6,22.0,6,CoarseM,c_Dwf); // 26 iter
 | |
|   //  ChebyshevSmoother<CoarseVector,  Level1Op5 >       CoarseSmoother2(0.6,22.0,6,CoarseM,c_Dwf);
 | |
|   //  ChebyshevSmoother<CoarseVector,  Level1Op5 >       CoarseSmoother1(0.5,22.0,5,CoarseM,c_Dwf); // 33 iter, 55s
 | |
|   //  ChebyshevSmoother<CoarseVector,  Level1Op5 >       CoarseSmoother2(0.5,22.0,5,CoarseM,c_Dwf);
 | |
| 
 | |
| 
 | |
|   CoarseMG Level2Precon (CoarseAggregates,
 | |
| 			 CoarseM,
 | |
| 			 CoarseSmoother1,
 | |
| 			 CoarseSmoother2,
 | |
| 			 cc_Dwf,
 | |
| 			 DeflCoarseCoarseCGNE);
 | |
|   Level2Precon.Level(2);
 | |
| 
 | |
|   //PrecGeneralisedConjugateResidualNonHermitian<CoarseVector>  L2PGCR(0.5, 100, CoarseM,Level2Precon,16,16); // 26 iter, 37s
 | |
|   // PGCR Applying this solver to solve the coarse space problem
 | |
|   // COULD BE FIXED???
 | |
|   PrecGeneralisedConjugateResidualNonHermitian<CoarseVector>  L2PGCR(0.0, 1, CoarseM,Level2Precon,2,2); 
 | |
| 
 | |
|   //PrecGeneralisedConjugateResidualNonHermitian<CoarseVector>  L2PGCR(1.0, 100, CoarseM,Level2Precon,16,16); // 35 iter, 45s
 | |
|   //PrecGeneralisedConjugateResidualNonHermitian<CoarseVector>  L2PGCR(0.6, 100, CoarseM,Level2Precon,16,16); // 26,38 (diifferene is measurement noise)
 | |
|   //PrecGeneralisedConjugateResidualNonHermitian<CoarseVector>  L2PGCR(0.2, 100, CoarseM,Level2Precon,16,16); // 26 iter, 47s
 | |
|   L2PGCR.Level(2);
 | |
| 
 | |
|   // Wrap the 2nd level solver in a MultiGrid preconditioner acting on the fine space
 | |
| 
 | |
|   //  ChebyshevSmoother<LatticeFermion,DomainWallFermionD> FineSmoother1(0.5,60.0,14,FineM,Ddwf); // 26 iter, 39s
 | |
|   //  ChebyshevSmoother<LatticeFermion,DomainWallFermionD> FineSmoother2(0.5,60.0,14,FineM,Ddwf);
 | |
| 
 | |
|   //  ChebyshevSmoother<LatticeFermion,DomainWallFermionD> FineSmoother1(0.5,60.0,12,FineM,Ddwf); // 25 iter, 38s
 | |
|   //  ChebyshevSmoother<LatticeFermion,DomainWallFermionD> FineSmoother2(0.5,60.0,16,FineM,Ddwf);
 | |
| 
 | |
|   //  ChebyshevSmoother<LatticeFermion,DomainWallFermionD> FineSmoother1(0.5,60.0,12,FineM,Ddwf); // 23 iter, 39s
 | |
|   //  ChebyshevSmoother<LatticeFermion,DomainWallFermionD> FineSmoother2(0.5,60.0,20,FineM,Ddwf);
 | |
| 
 | |
|   //  ChebyshevSmoother<LatticeFermion,DomainWallFermionD> FineSmoother1(0.5,60.0,10,FineM,Ddwf);24 iter, 44s
 | |
|   //  ChebyshevSmoother<LatticeFermion,DomainWallFermionD> FineSmoother2(0.5,60.0,24,FineM,Ddwf);
 | |
| 
 | |
|   //  ChebyshevSmoother<LatticeFermion,DomainWallFermionD> FineSmoother1(0.5,60.0,12,FineM,Ddwf); // odd convergence tail at 10^-9 ish
 | |
|   //  ChebyshevSmoother<LatticeFermion,DomainWallFermionD> FineSmoother2(0.1,60.0,24,FineM,Ddwf); // 33 iter, waas O(10-9 by 26)
 | |
| 
 | |
|   //  ChebyshevSmoother<LatticeFermion,DomainWallFermionD> FineSmoother1(0.5,60.0,12,FineM,Ddwf); // 25 iter, 39s
 | |
|   //  ChebyshevSmoother<LatticeFermion,DomainWallFermionD> FineSmoother2(0.5,60.0,18,FineM,Ddwf); //
 | |
| 
 | |
|   ChebyshevSmoother<LatticeFermion,DomainWallFermionD> FineSmoother1(0.5,60.0,16,FineM,Ddwf); 
 | |
|   ChebyshevSmoother<LatticeFermion,DomainWallFermionD> FineSmoother2(0.5,60.0,16,FineM,Ddwf); //
 | |
| 
 | |
|   //  ChebyshevSmoother<LatticeFermion,DomainWallFermionD> FineSmoother1(0.5,60.0,11,FineM,Ddwf); // 33 iter, 49s
 | |
|   //  ChebyshevSmoother<LatticeFermion,DomainWallFermionD> FineSmoother2(0.5,60.0,11,FineM,Ddwf);
 | |
|   //  ChebyshevSmoother<LatticeFermion,DomainWallFermionD> FineSmoother1(0.5,60.0,12,FineM,Ddwf); // 26 iter, 37s
 | |
|   //  ChebyshevSmoother<LatticeFermion,DomainWallFermionD> FineSmoother2(0.5,60.0,12,FineM,Ddwf);
 | |
|   //  ChebyshevSmoother<LatticeFermion,DomainWallFermionD> FineSmoother1(0.4,60.0,12,FineM,Ddwf); //  iter 26 no change in final residual
 | |
|   //  ChebyshevSmoother<LatticeFermion,DomainWallFermionD> FineSmoother2(0.4,60.0,12,FineM,Ddwf);
 | |
|   //  ChebyshevSmoother<LatticeFermion,DomainWallFermionD> FineSmoother1(0.3,60.0,12,FineM,Ddwf); // 27 iter 39s.
 | |
|   //  ChebyshevSmoother<LatticeFermion,DomainWallFermionD> FineSmoother2(0.3,60.0,12,FineM,Ddwf);
 | |
|   //  ChebyshevSmoother<LatticeFermion,DomainWallFermionD> FineSmoother1(0.3,60.0,13,FineM,Ddwf); // 26 iter, but slower
 | |
|   //  ChebyshevSmoother<LatticeFermion,DomainWallFermionD> FineSmoother2(0.3,60.0,13,FineM,Ddwf);
 | |
|   //  ChebyshevSmoother<LatticeFermion,DomainWallFermionD> FineSmoother1(1.0,60.0,12,FineM,Ddwf); // 34 iter, slower
 | |
|   //  ChebyshevSmoother<LatticeFermion,DomainWallFermionD> FineSmoother2(1.0,60.0,12,FineM,Ddwf);
 | |
| 
 | |
|   ThreeLevelMG ThreeLevelPrecon(Aggregates4D,
 | |
| 				FineM,
 | |
| 				FineSmoother1,
 | |
| 				FineSmoother2,
 | |
| 				c_Dwf,
 | |
| 				L2PGCR);
 | |
|   ThreeLevelPrecon.Level(1);
 | |
| 
 | |
|   PrecGeneralisedConjugateResidualNonHermitian<LatticeFermion> L1PGCR(1.0e-8,1000,FineM,ThreeLevelPrecon,16,16);
 | |
|   L1PGCR.Level(1);
 | |
| 
 | |
|   f_res=Zero();
 | |
|   L1PGCR(f_src,f_res);
 | |
|   }
 | |
|   
 | |
|   std::cout<<GridLogMessage << "**************************************************"<< std::endl;
 | |
|   std::cout<<GridLogMessage << "Done "<< std::endl;
 | |
|   std::cout<<GridLogMessage << "**************************************************"<< std::endl;
 | |
|   Grid_finalize();
 | |
|   
 | |
| }
 |