/************************************************************************************* Grid physics library, www.github.com/paboyle/Grid Source file: ./lib/qcd/action/fermion/CayleyFermion5D.cc Copyright (C) 2015 Author: Peter Boyle Author: Peter Boyle Author: Peter Boyle Author: paboyle This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 2 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program; if not, write to the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. See the full license in the file "LICENSE" in the top level distribution directory *************************************************************************************/ /* END LEGAL */ #include #include namespace Grid { namespace QCD { // FIXME -- make a version of these routines with site loop outermost for cache reuse. // Pminus forwards // Pplus backwards.. 
// Out-of-line definitions of four CayleyFermion5D members: M5D, M5Ddag, MooeeInv and
// MooeeInvDag, followed by the opening "#ifdef CAYLEY_DPERP_CACHE".
//
// NOTE(review): the text below appears to have lost every span that sat between a '<'
// and the following '>' (see "template void", "std::vector &lower", "ssoSites()",
// "for(int s=0;s void ..."). Template parameter lists, loop bounds and large parts of
// the function bodies are therefore missing; restore them from a pristine copy of the
// file before building. Everything is also on one physical line, so the first "//"
// comments out the remainder of that line. The notes here describe only what is still
// visible.
//
// M5D / M5Ddag (psi, phi, chi, lower, diag, upper):
//   - assert that phi and psi have the same checkerboard and copy it to chi;
//   - increment M5Dcalls and subtract usecond() from M5Dtime before the site loop;
//   - start a parallel_for over ss that advances by Ls per iteration;
//   - M5Ddag visibly initialises tmp from psi._odata[0] at the top of each ss
//     iteration; the per-s update formulae are not visible for either function.
//
// MooeeInv (psi, chi):
//   - copy psi's checkerboard to chi, increment MooeeInvCalls, and bracket the site
//     loop with MooeeInvTime -= usecond() / MooeeInvTime += usecond();
//   - per ss: tmp = psi._odata[0]; chi[ss] = psi[ss]; the surviving tail is a loop that
//     counts s down to 0 doing spProj5m(tmp, chi[ss+s+1]) and
//     chi[ss+s] = chi[ss+s] - uee[s]*tmp. The intermediate steps are missing.
//
// MooeeInvDag (psi, chi):
//   - NOTE(review): assert(psi.checkerboard == psi.checkerboard) compares psi with
//     itself, so it can never fire; chi.checkerboard is overwritten on the next
//     statement, so the assert looks like dead code -- confirm the intent.
//   - builds five vectors of length Ls (ueec, deec, leec, ueemc, leemc; element type
//     lost); the code that fills them is not visible;
//   - per ss: tmp = psi._odata[0]; chi[ss] = psi[ss]; the surviving tail counts s down
//     to 0 doing spProj5p(tmp, chi[ss+s+1]) and chi[ss+s] = chi[ss+s] - leec[s]*tmp;
//   - adds usecond() to MooeeInvTime after the site loop.
template void CayleyFermion5D::M5D(const FermionField &psi, const FermionField &phi, FermionField &chi, std::vector &lower, std::vector &diag, std::vector &upper) { int Ls =this->Ls; GridBase *grid=psi._grid; assert(phi.checkerboard == psi.checkerboard); chi.checkerboard=psi.checkerboard; // Flops = 6.0*(Nc*Ns) *Ls*vol M5Dcalls++; M5Dtime-=usecond(); parallel_for(int ss=0;ssoSites();ss+=Ls){ // adds Ls for(int s=0;s void CayleyFermion5D::M5Ddag(const FermionField &psi, const FermionField &phi, FermionField &chi, std::vector &lower, std::vector &diag, std::vector &upper) { int Ls =this->Ls; GridBase *grid=psi._grid; assert(phi.checkerboard == psi.checkerboard); chi.checkerboard=psi.checkerboard; // Flops = 6.0*(Nc*Ns) *Ls*vol M5Dcalls++; M5Dtime-=usecond(); parallel_for(int ss=0;ssoSites();ss+=Ls){ // adds Ls auto tmp = psi._odata[0]; for(int s=0;s void CayleyFermion5D::MooeeInv (const FermionField &psi, FermionField &chi) { GridBase *grid=psi._grid; int Ls=this->Ls; chi.checkerboard=psi.checkerboard; MooeeInvCalls++; MooeeInvTime-=usecond(); parallel_for(int ss=0;ssoSites();ss+=Ls){ // adds Ls auto tmp = psi._odata[0]; // flops = 12*2*Ls + 12*2*Ls + 3*12*Ls + 12*2*Ls = 12*Ls * (9) = 108*Ls flops // Apply (L^{\prime})^{-1} chi[ss]=psi[ss]; // chi[0]=psi[0] for(int s=1;s=0;s--){ spProj5m(tmp,chi[ss+s+1]); chi[ss+s] = chi[ss+s] - uee[s]*tmp; } } MooeeInvTime+=usecond(); } template void CayleyFermion5D::MooeeInvDag (const FermionField &psi, FermionField &chi) { GridBase *grid=psi._grid; int Ls=this->Ls; assert(psi.checkerboard == psi.checkerboard); chi.checkerboard=psi.checkerboard; std::vector ueec(Ls); std::vector deec(Ls); std::vector leec(Ls); std::vector ueemc(Ls); std::vector leemc(Ls); for(int s=0;soSites();ss+=Ls){ // adds Ls auto tmp = psi._odata[0]; // Apply (U^{\prime})^{-dagger} chi[ss]=psi[ss]; for (int s=1;s=0;s--){ spProj5p(tmp,chi[ss+s+1]); chi[ss+s] = chi[ss+s] - leec[s]*tmp; } } MooeeInvTime+=usecond(); } #ifdef CAYLEY_DPERP_CACHE 
// Invokes the INSTANTIATE_DPERP macro (defined outside this excerpt) once for each of
// WilsonImplF, WilsonImplD, GparityWilsonImplF, GparityWilsonImplD, ZWilsonImplF and
// ZWilsonImplD -- presumably the single- and double-precision variants of each
// implementation policy; confirm against the macro definition.
// The "#endif" pairs with the "#ifdef CAYLEY_DPERP_CACHE" at the end of the preceding
// line, and "}}" closes two brace scopes -- the "namespace Grid { namespace QCD {"
// opened at the top of the file.
// NOTE(review): a preprocessor directive must start its own line; as written, "#endif"
// sits mid-line and "}}" follows it on the same line, so both need to be moved onto
// separate lines for the file to be processed as intended.
INSTANTIATE_DPERP(WilsonImplF); INSTANTIATE_DPERP(WilsonImplD); INSTANTIATE_DPERP(GparityWilsonImplF); INSTANTIATE_DPERP(GparityWilsonImplD); INSTANTIATE_DPERP(ZWilsonImplF); INSTANTIATE_DPERP(ZWilsonImplD); #endif }}