diff --git a/lib/qcd/action/fermion/MobiusEOFAFermionssp.cc b/lib/qcd/action/fermion/MobiusEOFAFermionssp.cc index c86bb995..7a6f44e9 100644 --- a/lib/qcd/action/fermion/MobiusEOFAFermionssp.cc +++ b/lib/qcd/action/fermion/MobiusEOFAFermionssp.cc @@ -28,263 +28,262 @@ with this program; if not, write to the Free Software Foundation, Inc., See the full license in the file "LICENSE" in the top level distribution directory *************************************************************************************/ -/* END LEGAL */ + /* END LEGAL */ #include #include -namespace Grid { -namespace QCD { +NAMESPACE_BEGIN(Grid); - // FIXME -- make a version of these routines with site loop outermost for cache reuse. - // Pminus fowards - // Pplus backwards - template - void MobiusEOFAFermion::M5D(const FermionField& psi, const FermionField& phi, - FermionField& chi, std::vector& lower, std::vector& diag, std::vector& upper) - { - Coeff_t one(1.0); - int Ls = this->Ls; - for(int s=0; s +void MobiusEOFAFermion::M5D(const FermionField& psi, const FermionField& phi, + FermionField& chi, std::vector& lower, std::vector& diag, std::vector& upper) +{ + Coeff_t one(1.0); + int Ls = this->Ls; + for(int s=0; s - void MobiusEOFAFermion::M5D_shift(const FermionField& psi, const FermionField& phi, - FermionField& chi, std::vector& lower, std::vector& diag, std::vector& upper, - std::vector& shift_coeffs) - { - Coeff_t one(1.0); - int Ls = this->Ls; - for(int s=0; spm == 1){ axpby_ssp_pplus(chi, one, chi, shift_coeffs[s], psi, s, Ls-1); } - else{ axpby_ssp_pminus(chi, one, chi, shift_coeffs[s], psi, s, 0); } +template +void MobiusEOFAFermion::M5D_shift(const FermionField& psi, const FermionField& phi, + FermionField& chi, std::vector& lower, std::vector& diag, std::vector& upper, + std::vector& shift_coeffs) +{ + Coeff_t one(1.0); + int Ls = this->Ls; + for(int s=0; spm == 1){ axpby_ssp_pplus(chi, one, chi, shift_coeffs[s], psi, s, Ls-1); } + else{ axpby_ssp_pminus(chi, one, chi, shift_coeffs[s], psi, s, 0); } + } +} + +template +void MobiusEOFAFermion::M5Ddag(const FermionField& psi, const FermionField& phi, + FermionField& chi, std::vector& lower, std::vector& diag, std::vector& upper) +{ + Coeff_t one(1.0); + int Ls = this->Ls; + for(int s=0; s - void MobiusEOFAFermion::M5Ddag(const FermionField& psi, const FermionField& phi, - FermionField& chi, std::vector& lower, std::vector& diag, std::vector& upper) - { - Coeff_t one(1.0); - int Ls = this->Ls; - for(int s=0; s +void MobiusEOFAFermion::M5Ddag_shift(const FermionField& psi, const FermionField& phi, + FermionField& chi, std::vector& lower, std::vector& diag, std::vector& upper, + std::vector& shift_coeffs) +{ + Coeff_t one(1.0); + int Ls = this->Ls; + for(int s=0; spm == 1){ axpby_ssp_pplus(chi, one, chi, shift_coeffs[s], psi, Ls-1, s); } + else{ axpby_ssp_pminus(chi, one, chi, shift_coeffs[s], psi, 0, s); } + } +} + +template +void MobiusEOFAFermion::MooeeInv(const FermionField& psi, FermionField& chi) +{ + if(this->shift != 0.0){ MooeeInv_shift(psi,chi); return; } + + Coeff_t one(1.0); + Coeff_t czero(0.0); + chi.checkerboard = psi.checkerboard; + int Ls = this->Ls; + + // Apply (L^{\prime})^{-1} + axpby_ssp(chi, one, psi, czero, psi, 0, 0); // chi[0]=psi[0] + for(int s=1; slee[s-1], chi, s, s-1);// recursion Psi[s] -lee P_+ chi[s-1] } - template - void MobiusEOFAFermion::M5Ddag_shift(const FermionField& psi, const FermionField& phi, - FermionField& chi, std::vector& lower, std::vector& diag, std::vector& upper, - std::vector& shift_coeffs) - { - Coeff_t one(1.0); - int Ls = this->Ls; - for(int s=0; spm == 1){ axpby_ssp_pplus(chi, one, chi, shift_coeffs[s], psi, Ls-1, s); } - else{ axpby_ssp_pminus(chi, one, chi, shift_coeffs[s], psi, 0, s); } - } + // L_m^{-1} + for(int s=0; sleem[s], chi, Ls-1, s); } - template - void MobiusEOFAFermion::MooeeInv(const FermionField& psi, FermionField& chi) - { - if(this->shift != 0.0){ MooeeInv_shift(psi,chi); return; } + // U_m^{-1} D^{-1} + for(int s=0; sdee[s], chi, -this->ueem[s]/this->dee[Ls-1], chi, s, Ls-1); + } + axpby_ssp(chi, one/this->dee[Ls-1], chi, czero, chi, Ls-1, Ls-1); - Coeff_t one(1.0); - Coeff_t czero(0.0); - chi.checkerboard = psi.checkerboard; - int Ls = this->Ls; + // Apply U^{-1} + for(int s=Ls-2; s>=0; s--){ + axpby_ssp_pminus(chi, one, chi, -this->uee[s], chi, s, s+1); // chi[Ls] + } +} - // Apply (L^{\prime})^{-1} - axpby_ssp(chi, one, psi, czero, psi, 0, 0); // chi[0]=psi[0] - for(int s=1; slee[s-1], chi, s, s-1);// recursion Psi[s] -lee P_+ chi[s-1] - } +template +void MobiusEOFAFermion::MooeeInv_shift(const FermionField& psi, FermionField& chi) +{ + Coeff_t one(1.0); + Coeff_t czero(0.0); + chi.checkerboard = psi.checkerboard; + int Ls = this->Ls; - // L_m^{-1} - for(int s=0; sleem[s], chi, Ls-1, s); - } + FermionField tmp(psi._grid); - // U_m^{-1} D^{-1} - for(int s=0; sdee[s], chi, -this->ueem[s]/this->dee[Ls-1], chi, s, Ls-1); - } - axpby_ssp(chi, one/this->dee[Ls-1], chi, czero, chi, Ls-1, Ls-1); - - // Apply U^{-1} - for(int s=Ls-2; s>=0; s--){ - axpby_ssp_pminus(chi, one, chi, -this->uee[s], chi, s, s+1); // chi[Ls] - } + // Apply (L^{\prime})^{-1} + axpby_ssp(chi, one, psi, czero, psi, 0, 0); // chi[0]=psi[0] + axpby_ssp(tmp, czero, tmp, this->MooeeInv_shift_lc[0], psi, 0, 0); + for(int s=1; slee[s-1], chi, s, s-1);// recursion Psi[s] -lee P_+ chi[s-1] + axpby_ssp(tmp, one, tmp, this->MooeeInv_shift_lc[s], psi, 0, s); } - template - void MobiusEOFAFermion::MooeeInv_shift(const FermionField& psi, FermionField& chi) - { - Coeff_t one(1.0); - Coeff_t czero(0.0); - chi.checkerboard = psi.checkerboard; - int Ls = this->Ls; - - FermionField tmp(psi._grid); - - // Apply (L^{\prime})^{-1} - axpby_ssp(chi, one, psi, czero, psi, 0, 0); // chi[0]=psi[0] - axpby_ssp(tmp, czero, tmp, this->MooeeInv_shift_lc[0], psi, 0, 0); - for(int s=1; slee[s-1], chi, s, s-1);// recursion Psi[s] -lee P_+ chi[s-1] - axpby_ssp(tmp, one, tmp, this->MooeeInv_shift_lc[s], psi, 0, s); - } - - // L_m^{-1} - for(int s=0; sleem[s], chi, Ls-1, s); - } - - // U_m^{-1} D^{-1} - for(int s=0; sdee[s], chi, -this->ueem[s]/this->dee[Ls-1], chi, s, Ls-1); - } - axpby_ssp(chi, one/this->dee[Ls-1], chi, czero, chi, Ls-1, Ls-1); - - // Apply U^{-1} and add shift term - if(this->pm == 1){ axpby_ssp_pplus(chi, one, chi, this->MooeeInv_shift_norm[Ls-1], tmp, Ls-1, 0); } - else{ axpby_ssp_pminus(chi, one, chi, this->MooeeInv_shift_norm[Ls-1], tmp, Ls-1, 0); } - for(int s=Ls-2; s>=0; s--){ - axpby_ssp_pminus(chi, one, chi, -this->uee[s], chi, s, s+1); // chi[Ls] - if(this->pm == 1){ axpby_ssp_pplus(chi, one, chi, this->MooeeInv_shift_norm[s], tmp, s, 0); } - else{ axpby_ssp_pminus(chi, one, chi, this->MooeeInv_shift_norm[s], tmp, s, 0); } - } + // L_m^{-1} + for(int s=0; sleem[s], chi, Ls-1, s); } - template - void MobiusEOFAFermion::MooeeInvDag(const FermionField& psi, FermionField& chi) - { - if(this->shift != 0.0){ MooeeInvDag_shift(psi,chi); return; } + // U_m^{-1} D^{-1} + for(int s=0; sdee[s], chi, -this->ueem[s]/this->dee[Ls-1], chi, s, Ls-1); + } + axpby_ssp(chi, one/this->dee[Ls-1], chi, czero, chi, Ls-1, Ls-1); - Coeff_t one(1.0); - Coeff_t czero(0.0); - chi.checkerboard = psi.checkerboard; - int Ls = this->Ls; + // Apply U^{-1} and add shift term + if(this->pm == 1){ axpby_ssp_pplus(chi, one, chi, this->MooeeInv_shift_norm[Ls-1], tmp, Ls-1, 0); } + else{ axpby_ssp_pminus(chi, one, chi, this->MooeeInv_shift_norm[Ls-1], tmp, Ls-1, 0); } + for(int s=Ls-2; s>=0; s--){ + axpby_ssp_pminus(chi, one, chi, -this->uee[s], chi, s, s+1); // chi[Ls] + if(this->pm == 1){ axpby_ssp_pplus(chi, one, chi, this->MooeeInv_shift_norm[s], tmp, s, 0); } + else{ axpby_ssp_pminus(chi, one, chi, this->MooeeInv_shift_norm[s], tmp, s, 0); } + } +} - // Apply (U^{\prime})^{-dagger} - axpby_ssp(chi, one, psi, czero, psi, 0, 0); // chi[0]=psi[0] - for(int s=1; suee[s-1]), chi, s, s-1); - } +template +void MobiusEOFAFermion::MooeeInvDag(const FermionField& psi, FermionField& chi) +{ + if(this->shift != 0.0){ MooeeInvDag_shift(psi,chi); return; } - // U_m^{-\dagger} - for(int s=0; sueem[s]), chi, Ls-1, s); - } + Coeff_t one(1.0); + Coeff_t czero(0.0); + chi.checkerboard = psi.checkerboard; + int Ls = this->Ls; - // L_m^{-\dagger} D^{-dagger} - for(int s=0; sdee[s]), chi, -conjugate(this->leem[s]/this->dee[Ls-1]), chi, s, Ls-1); - } - axpby_ssp(chi, one/conjugate(this->dee[Ls-1]), chi, czero, chi, Ls-1, Ls-1); - - // Apply L^{-dagger} - for(int s=Ls-2; s>=0; s--){ - axpby_ssp_pplus(chi, one, chi, -conjugate(this->lee[s]), chi, s, s+1); // chi[Ls] - } + // Apply (U^{\prime})^{-dagger} + axpby_ssp(chi, one, psi, czero, psi, 0, 0); // chi[0]=psi[0] + for(int s=1; suee[s-1]), chi, s, s-1); } - template - void MobiusEOFAFermion::MooeeInvDag_shift(const FermionField& psi, FermionField& chi) - { - Coeff_t one(1.0); - Coeff_t czero(0.0); - chi.checkerboard = psi.checkerboard; - int Ls = this->Ls; - - FermionField tmp(psi._grid); - - // Apply (U^{\prime})^{-dagger} and accumulate (MooeeInvDag_shift_lc)_{j} \psi_{j} in tmp[0] - axpby_ssp(chi, one, psi, czero, psi, 0, 0); // chi[0]=psi[0] - axpby_ssp(tmp, czero, tmp, this->MooeeInvDag_shift_lc[0], psi, 0, 0); - for(int s=1; suee[s-1]), chi, s, s-1); - axpby_ssp(tmp, one, tmp, this->MooeeInvDag_shift_lc[s], psi, 0, s); - } - - // U_m^{-\dagger} - for(int s=0; sueem[s]), chi, Ls-1, s); - } - - // L_m^{-\dagger} D^{-dagger} - for(int s=0; sdee[s]), chi, -conjugate(this->leem[s]/this->dee[Ls-1]), chi, s, Ls-1); - } - axpby_ssp(chi, one/conjugate(this->dee[Ls-1]), chi, czero, chi, Ls-1, Ls-1); - - // Apply L^{-dagger} and add shift - if(this->pm == 1){ axpby_ssp_pplus(chi, one, chi, this->MooeeInvDag_shift_norm[Ls-1], tmp, Ls-1, 0); } - else{ axpby_ssp_pminus(chi, one, chi, this->MooeeInvDag_shift_norm[Ls-1], tmp, Ls-1, 0); } - for(int s=Ls-2; s>=0; s--){ - axpby_ssp_pplus(chi, one, chi, -conjugate(this->lee[s]), chi, s, s+1); // chi[Ls] - if(this->pm == 1){ axpby_ssp_pplus(chi, one, chi, this->MooeeInvDag_shift_norm[s], tmp, s, 0); } - else{ axpby_ssp_pminus(chi, one, chi, this->MooeeInvDag_shift_norm[s], tmp, s, 0); } - } + // U_m^{-\dagger} + for(int s=0; sueem[s]), chi, Ls-1, s); } - #ifdef MOBIUS_EOFA_DPERP_LINALG + // L_m^{-\dagger} D^{-dagger} + for(int s=0; sdee[s]), chi, -conjugate(this->leem[s]/this->dee[Ls-1]), chi, s, Ls-1); + } + axpby_ssp(chi, one/conjugate(this->dee[Ls-1]), chi, czero, chi, Ls-1, Ls-1); - INSTANTIATE_DPERP_MOBIUS_EOFA(WilsonImplF); - INSTANTIATE_DPERP_MOBIUS_EOFA(WilsonImplD); - INSTANTIATE_DPERP_MOBIUS_EOFA(GparityWilsonImplF); - INSTANTIATE_DPERP_MOBIUS_EOFA(GparityWilsonImplD); - INSTANTIATE_DPERP_MOBIUS_EOFA(ZWilsonImplF); - INSTANTIATE_DPERP_MOBIUS_EOFA(ZWilsonImplD); + // Apply L^{-dagger} + for(int s=Ls-2; s>=0; s--){ + axpby_ssp_pplus(chi, one, chi, -conjugate(this->lee[s]), chi, s, s+1); // chi[Ls] + } +} - INSTANTIATE_DPERP_MOBIUS_EOFA(WilsonImplFH); - INSTANTIATE_DPERP_MOBIUS_EOFA(WilsonImplDF); - INSTANTIATE_DPERP_MOBIUS_EOFA(GparityWilsonImplFH); - INSTANTIATE_DPERP_MOBIUS_EOFA(GparityWilsonImplDF); - INSTANTIATE_DPERP_MOBIUS_EOFA(ZWilsonImplFH); - INSTANTIATE_DPERP_MOBIUS_EOFA(ZWilsonImplDF); +template +void MobiusEOFAFermion::MooeeInvDag_shift(const FermionField& psi, FermionField& chi) +{ + Coeff_t one(1.0); + Coeff_t czero(0.0); + chi.checkerboard = psi.checkerboard; + int Ls = this->Ls; - #endif + FermionField tmp(psi._grid); -}} + // Apply (U^{\prime})^{-dagger} and accumulate (MooeeInvDag_shift_lc)_{j} \psi_{j} in tmp[0] + axpby_ssp(chi, one, psi, czero, psi, 0, 0); // chi[0]=psi[0] + axpby_ssp(tmp, czero, tmp, this->MooeeInvDag_shift_lc[0], psi, 0, 0); + for(int s=1; suee[s-1]), chi, s, s-1); + axpby_ssp(tmp, one, tmp, this->MooeeInvDag_shift_lc[s], psi, 0, s); + } + + // U_m^{-\dagger} + for(int s=0; sueem[s]), chi, Ls-1, s); + } + + // L_m^{-\dagger} D^{-dagger} + for(int s=0; sdee[s]), chi, -conjugate(this->leem[s]/this->dee[Ls-1]), chi, s, Ls-1); + } + axpby_ssp(chi, one/conjugate(this->dee[Ls-1]), chi, czero, chi, Ls-1, Ls-1); + + // Apply L^{-dagger} and add shift + if(this->pm == 1){ axpby_ssp_pplus(chi, one, chi, this->MooeeInvDag_shift_norm[Ls-1], tmp, Ls-1, 0); } + else{ axpby_ssp_pminus(chi, one, chi, this->MooeeInvDag_shift_norm[Ls-1], tmp, Ls-1, 0); } + for(int s=Ls-2; s>=0; s--){ + axpby_ssp_pplus(chi, one, chi, -conjugate(this->lee[s]), chi, s, s+1); // chi[Ls] + if(this->pm == 1){ axpby_ssp_pplus(chi, one, chi, this->MooeeInvDag_shift_norm[s], tmp, s, 0); } + else{ axpby_ssp_pminus(chi, one, chi, this->MooeeInvDag_shift_norm[s], tmp, s, 0); } + } +} + +#ifdef MOBIUS_EOFA_DPERP_LINALG + +INSTANTIATE_DPERP_MOBIUS_EOFA(WilsonImplF); +INSTANTIATE_DPERP_MOBIUS_EOFA(WilsonImplD); +INSTANTIATE_DPERP_MOBIUS_EOFA(GparityWilsonImplF); +INSTANTIATE_DPERP_MOBIUS_EOFA(GparityWilsonImplD); +INSTANTIATE_DPERP_MOBIUS_EOFA(ZWilsonImplF); +INSTANTIATE_DPERP_MOBIUS_EOFA(ZWilsonImplD); + +INSTANTIATE_DPERP_MOBIUS_EOFA(WilsonImplFH); +INSTANTIATE_DPERP_MOBIUS_EOFA(WilsonImplDF); +INSTANTIATE_DPERP_MOBIUS_EOFA(GparityWilsonImplFH); +INSTANTIATE_DPERP_MOBIUS_EOFA(GparityWilsonImplDF); +INSTANTIATE_DPERP_MOBIUS_EOFA(ZWilsonImplFH); +INSTANTIATE_DPERP_MOBIUS_EOFA(ZWilsonImplDF); + +#endif + +NAMESPACE_END(Grid);