mirror of
				https://github.com/paboyle/Grid.git
				synced 2025-10-25 10:09:34 +01:00 
			
		
		
		
	
		
			
				
	
	
		
			250 lines
		
	
	
		
			7.1 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			250 lines
		
	
	
		
			7.1 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
|     /*************************************************************************************
 | |
| 
 | |
|     Grid physics library, www.github.com/paboyle/Grid 
 | |
| 
 | |
|     Source file: ./lib/qcd/action/fermion/CayleyFermion5D.cc
 | |
| 
 | |
|     Copyright (C) 2015
 | |
| 
 | |
| Author: Peter Boyle <pabobyle@ph.ed.ac.uk>
 | |
| Author: Peter Boyle <paboyle@ph.ed.ac.uk>
 | |
| Author: Peter Boyle <peterboyle@Peters-MacBook-Pro-2.local>
 | |
| Author: paboyle <paboyle@ph.ed.ac.uk>
 | |
| 
 | |
|     This program is free software; you can redistribute it and/or modify
 | |
|     it under the terms of the GNU General Public License as published by
 | |
|     the Free Software Foundation; either version 2 of the License, or
 | |
|     (at your option) any later version.
 | |
| 
 | |
|     This program is distributed in the hope that it will be useful,
 | |
|     but WITHOUT ANY WARRANTY; without even the implied warranty of
 | |
|     MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | |
|     GNU General Public License for more details.
 | |
| 
 | |
|     You should have received a copy of the GNU General Public License along
 | |
|     with this program; if not, write to the Free Software Foundation, Inc.,
 | |
|     51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
 | |
| 
 | |
|     See the full license in the file "LICENSE" in the top level distribution directory
 | |
|     *************************************************************************************/
 | |
|     /*  END LEGAL */
 | |
| 
 | |
| #include <Grid/qcd/action/fermion/FermionCore.h>
 | |
| #include <Grid/qcd/action/fermion/CayleyFermion5D.h>
 | |
| 
 | |
| 
 | |
| namespace Grid {
 | |
| namespace QCD {
 | |
| 
 | |
|   // FIXME -- make a version of these routines with site loop outermost for cache reuse.
 | |
| 
 | |
|   // Pminus fowards
 | |
|   // Pplus  backwards..
 | |
| template<class Impl>  
 | |
| void CayleyFermion5D<Impl>::M5D(const FermionField &psi,
 | |
| 				const FermionField &phi, 
 | |
| 				FermionField &chi,
 | |
| 				std::vector<Coeff_t> &lower,
 | |
| 				std::vector<Coeff_t> &diag,
 | |
| 				std::vector<Coeff_t> &upper)
 | |
| {
 | |
|   int Ls =this->Ls;
 | |
|   GridBase *grid=psi._grid;
 | |
|   assert(phi.checkerboard == psi.checkerboard);
 | |
|   chi.checkerboard=psi.checkerboard;
 | |
|   // Flops = 6.0*(Nc*Ns) *Ls*vol
 | |
|   M5Dcalls++;
 | |
|   M5Dtime-=usecond();
 | |
| 
 | |
|   parallel_for(int ss=0;ss<grid->oSites();ss+=Ls){ // adds Ls
 | |
|     for(int s=0;s<Ls;s++){
 | |
|       auto tmp = psi._odata[0];
 | |
|       if ( s==0 ) {
 | |
|  	                            spProj5m(tmp,psi._odata[ss+s+1]);
 | |
| 	chi[ss+s]=diag[s]*phi[ss+s]+upper[s]*tmp;
 | |
| 
 | |
| 	                    spProj5p(tmp,psi._odata[ss+Ls-1]);
 | |
| 	chi[ss+s]=chi[ss+s]+lower[s]*tmp;
 | |
|       } else if ( s==(Ls-1)) {
 | |
| 	                            spProj5m(tmp,psi._odata[ss+0]);
 | |
| 	chi[ss+s]=diag[s]*phi[ss+s]+upper[s]*tmp;
 | |
| 
 | |
|  	                    spProj5p(tmp,psi._odata[ss+s-1]);
 | |
| 	chi[ss+s]=chi[ss+s]+lower[s]*tmp;
 | |
|       } else { 
 | |
| 	                            spProj5m(tmp,psi._odata[ss+s+1]);
 | |
| 	chi[ss+s]=diag[s]*phi[ss+s]+upper[s]*tmp;
 | |
| 
 | |
| 	                    spProj5p(tmp,psi._odata[ss+s-1]);
 | |
| 	chi[ss+s]=chi[ss+s]+lower[s]*tmp;
 | |
|       }
 | |
|     }
 | |
|   }
 | |
|   M5Dtime+=usecond();
 | |
| }
 | |
| 
 | |
| template<class Impl>  
 | |
| void CayleyFermion5D<Impl>::M5Ddag(const FermionField &psi,
 | |
| 				   const FermionField &phi, 
 | |
| 				   FermionField &chi,
 | |
| 				   std::vector<Coeff_t> &lower,
 | |
| 				   std::vector<Coeff_t> &diag,
 | |
| 				   std::vector<Coeff_t> &upper)
 | |
| {
 | |
|   int Ls =this->Ls;
 | |
|   GridBase *grid=psi._grid;
 | |
|   assert(phi.checkerboard == psi.checkerboard);
 | |
|   chi.checkerboard=psi.checkerboard;
 | |
| 
 | |
|   // Flops = 6.0*(Nc*Ns) *Ls*vol
 | |
|   M5Dcalls++;
 | |
|   M5Dtime-=usecond();
 | |
| 
 | |
|   parallel_for(int ss=0;ss<grid->oSites();ss+=Ls){ // adds Ls
 | |
|     auto tmp = psi._odata[0];
 | |
|     for(int s=0;s<Ls;s++){
 | |
|       if ( s==0 ) {
 | |
| 	spProj5p(tmp,psi._odata[ss+s+1]);
 | |
| 	chi[ss+s]=diag[s]*phi[ss+s]+upper[s]*tmp;
 | |
| 
 | |
| 	spProj5m(tmp,psi._odata[ss+Ls-1]);
 | |
| 	chi[ss+s]=chi[ss+s]+lower[s]*tmp;
 | |
|       } else if ( s==(Ls-1)) {
 | |
| 	spProj5p(tmp,psi._odata[ss+0]);
 | |
| 	chi[ss+s]=diag[s]*phi[ss+s]+upper[s]*tmp;
 | |
| 
 | |
| 	spProj5m(tmp,psi._odata[ss+s-1]);
 | |
| 	chi[ss+s]=chi[ss+s]+lower[s]*tmp;
 | |
|       } else { 
 | |
| 	spProj5p(tmp,psi._odata[ss+s+1]);
 | |
| 	chi[ss+s]=diag[s]*phi[ss+s]+upper[s]*tmp;
 | |
| 
 | |
| 	spProj5m(tmp,psi._odata[ss+s-1]);
 | |
| 	chi[ss+s]=chi[ss+s]+lower[s]*tmp;
 | |
|       }
 | |
|     }
 | |
|   }
 | |
|   M5Dtime+=usecond();
 | |
| }
 | |
| 
 | |
| template<class Impl>
 | |
| void CayleyFermion5D<Impl>::MooeeInv    (const FermionField &psi, FermionField &chi)
 | |
| {
 | |
|   GridBase *grid=psi._grid;
 | |
|   int Ls=this->Ls;
 | |
| 
 | |
|   chi.checkerboard=psi.checkerboard;
 | |
| 
 | |
|   MooeeInvCalls++;
 | |
|   MooeeInvTime-=usecond();
 | |
| 
 | |
|   parallel_for(int ss=0;ss<grid->oSites();ss+=Ls){ // adds Ls
 | |
|     auto tmp = psi._odata[0];
 | |
| 
 | |
|     // flops = 12*2*Ls + 12*2*Ls + 3*12*Ls + 12*2*Ls  = 12*Ls * (9) = 108*Ls flops
 | |
|     // Apply (L^{\prime})^{-1}
 | |
|     chi[ss]=psi[ss]; // chi[0]=psi[0]
 | |
|     for(int s=1;s<Ls;s++){
 | |
|                             spProj5p(tmp,chi[ss+s-1]);  
 | |
|       chi[ss+s] = psi[ss+s]-lee[s-1]*tmp;
 | |
|     }
 | |
|     // L_m^{-1} 
 | |
|     for (int s=0;s<Ls-1;s++){ // Chi[ee] = 1 - sum[s<Ls-1] -leem[s]P_- chi
 | |
|                                    spProj5m(tmp,chi[ss+s]);    
 | |
|       chi[ss+Ls-1] = chi[ss+Ls-1] - leem[s]*tmp;
 | |
|     }
 | |
|     // U_m^{-1} D^{-1}
 | |
|     for (int s=0;s<Ls-1;s++){
 | |
|       // Chi[s] + 1/d chi[s] 
 | |
|                                                 spProj5p(tmp,chi[ss+Ls-1]); 
 | |
|       chi[ss+s] = (1.0/dee[s])*chi[ss+s]-(ueem[s]/dee[Ls-1])*tmp;
 | |
|     }	
 | |
|     chi[ss+Ls-1]= (1.0/dee[Ls-1])*chi[ss+Ls-1];
 | |
|       
 | |
|     // Apply U^{-1}
 | |
|     for (int s=Ls-2;s>=0;s--){
 | |
|                             spProj5m(tmp,chi[ss+s+1]);  
 | |
|       chi[ss+s] = chi[ss+s] - uee[s]*tmp;
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   MooeeInvTime+=usecond();
 | |
| 
 | |
| }
 | |
| 
 | |
| template<class Impl>
 | |
| void CayleyFermion5D<Impl>::MooeeInvDag (const FermionField &psi, FermionField &chi)
 | |
| {
 | |
|   GridBase *grid=psi._grid;
 | |
|   int Ls=this->Ls;
 | |
| 
 | |
|   assert(psi.checkerboard == psi.checkerboard);
 | |
|   chi.checkerboard=psi.checkerboard;
 | |
| 
 | |
|   std::vector<Coeff_t> ueec(Ls);
 | |
|   std::vector<Coeff_t> deec(Ls);
 | |
|   std::vector<Coeff_t> leec(Ls);
 | |
|   std::vector<Coeff_t> ueemc(Ls);
 | |
|   std::vector<Coeff_t> leemc(Ls);
 | |
|   for(int s=0;s<ueec.size();s++){
 | |
|     ueec[s] = conjugate(uee[s]);
 | |
|     deec[s] = conjugate(dee[s]);
 | |
|     leec[s] = conjugate(lee[s]);
 | |
|     ueemc[s]= conjugate(ueem[s]);
 | |
|     leemc[s]= conjugate(leem[s]);
 | |
|   }
 | |
|   MooeeInvCalls++;
 | |
|   MooeeInvTime-=usecond();
 | |
| 
 | |
|   parallel_for(int ss=0;ss<grid->oSites();ss+=Ls){ // adds Ls
 | |
| 
 | |
|     auto tmp = psi._odata[0];
 | |
| 
 | |
|     // Apply (U^{\prime})^{-dagger}
 | |
|     chi[ss]=psi[ss];
 | |
|     for (int s=1;s<Ls;s++){
 | |
|                             spProj5m(tmp,chi[ss+s-1]);
 | |
|       chi[ss+s] = psi[ss+s]-ueec[s-1]*tmp;
 | |
|     }
 | |
|     // U_m^{-\dagger} 
 | |
|     for (int s=0;s<Ls-1;s++){
 | |
|                                    spProj5p(tmp,chi[ss+s]);
 | |
|       chi[ss+Ls-1] = chi[ss+Ls-1] - ueemc[s]*tmp;
 | |
|     }
 | |
| 
 | |
|     // L_m^{-\dagger} D^{-dagger}
 | |
|     for (int s=0;s<Ls-1;s++){
 | |
|       spProj5m(tmp,chi[ss+Ls-1]);
 | |
|       chi[ss+s] = (1.0/deec[s])*chi[ss+s]-(leemc[s]/deec[Ls-1])*tmp;
 | |
|     }	
 | |
|     chi[ss+Ls-1]= (1.0/deec[Ls-1])*chi[ss+Ls-1];
 | |
|   
 | |
|     // Apply L^{-dagger}
 | |
|     for (int s=Ls-2;s>=0;s--){
 | |
|       spProj5p(tmp,chi[ss+s+1]);
 | |
|       chi[ss+s] = chi[ss+s] - leec[s]*tmp;
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   MooeeInvTime+=usecond();
 | |
| 
 | |
| }
 | |
| 
 | |
| #ifdef CAYLEY_DPERP_CACHE
 | |
|   INSTANTIATE_DPERP(WilsonImplF);
 | |
|   INSTANTIATE_DPERP(WilsonImplD);
 | |
|   INSTANTIATE_DPERP(GparityWilsonImplF);
 | |
|   INSTANTIATE_DPERP(GparityWilsonImplD);
 | |
|   INSTANTIATE_DPERP(ZWilsonImplF);
 | |
|   INSTANTIATE_DPERP(ZWilsonImplD);
 | |
| 
 | |
|   INSTANTIATE_DPERP(WilsonImplFH);
 | |
|   INSTANTIATE_DPERP(WilsonImplDF);
 | |
|   INSTANTIATE_DPERP(GparityWilsonImplFH);
 | |
|   INSTANTIATE_DPERP(GparityWilsonImplDF);
 | |
|   INSTANTIATE_DPERP(ZWilsonImplFH);
 | |
|   INSTANTIATE_DPERP(ZWilsonImplDF);
 | |
| #endif
 | |
| 
 | |
| }}
 |