// Provenance: Grid/lib/qcd/action/fermion/WilsonKernels.cc
// (mirror of https://github.com/paboyle/Grid.git, synced 2024-11-14 09:45:36 +00:00)

/*************************************************************************************
Grid physics library, www.github.com/paboyle/Grid
Source file: ./lib/qcd/action/fermion/WilsonKernels.cc
Copyright (C) 2015
Author: Peter Boyle <paboyle@ph.ed.ac.uk>
Author: Peter Boyle <peterboyle@Peters-MacBook-Pro-2.local>
Author: paboyle <paboyle@ph.ed.ac.uk>
This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; either version 2 of the License, or
(at your option) any later version.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License along
with this program; if not, write to the Free Software Foundation, Inc.,
51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
See the full license in the file "LICENSE" in the top level distribution directory
*************************************************************************************/
/* END LEGAL */
#include <Grid.h>
namespace Grid {
namespace QCD {
// Definitions of the kernel-selection flags read by DiracOptDhopSite and
// DiracOptDhopSiteDag below: a non-zero AsmOpt selects the Asm kernel, a
// non-zero HandOpt selects the Hand kernel, otherwise the Generic kernel runs.
// Neither definition has an initializer, so both start out as 0.
int WilsonKernelsStatic::HandOpt;
int WilsonKernelsStatic::AsmOpt;
// Constructor: forwards the implementation parameters unchanged to Base.
template<class Impl>
WilsonKernels<Impl>::WilsonKernels(const ImplParams &p) : Base(p) {}
// Single-site hopping-term entry point.
// Picks the kernel variant from the static flags, in priority order:
//   AsmOpt  != 0 -> DiracOptAsmDhopSite
//   HandOpt != 0 -> DiracOptHandDhopSite
//   otherwise    -> DiracOptGenericDhopSite
// All arguments are passed through untouched to the selected kernel.
template<class Impl>
void WilsonKernels<Impl>::DiracOptDhopSite(StencilImpl &st,DoubledGaugeField &U,
                                           std::vector<SiteHalfSpinor,alignedAllocator<SiteHalfSpinor> > &buf,
                                           int sF,int sU,const FermionField &in, FermionField &out)
{
  if ( AsmOpt ) {
    WilsonKernels<Impl>::DiracOptAsmDhopSite(st,U,buf,sF,sU,in,out);
    return;
  }
  if ( HandOpt ) {
    WilsonKernels<Impl>::DiracOptHandDhopSite(st,U,buf,sF,sU,in,out);
    return;
  }
  WilsonKernels<Impl>::DiracOptGenericDhopSite(st,U,buf,sF,sU,in,out);
}
// Single-site entry point for the "Dag" variant of the hopping term.
// Dispatches to DiracOptHandDhopSiteDag when HandOpt is non-zero and to
// DiracOptGenericDhopSiteDag otherwise. All arguments are forwarded untouched.
template<class Impl>
void WilsonKernels<Impl>::DiracOptDhopSiteDag(StencilImpl &st,DoubledGaugeField &U,
                                              std::vector<SiteHalfSpinor,alignedAllocator<SiteHalfSpinor> > &buf,
                                              int sF,int sU,const FermionField &in, FermionField &out)
{
  // No asm implementation yet, so AsmOpt is deliberately not consulted here.
  // Once one exists the dispatch becomes:
  //   if ( AsmOpt ) WilsonKernels<Impl>::DiracOptAsmDhopSiteDag(st,U,buf,sF,sU,in,out);
  //   else
  if ( HandOpt ) WilsonKernels<Impl>::DiracOptHandDhopSiteDag(st,U,buf,sF,sU,in,out);
  else           WilsonKernels<Impl>::DiracOptGenericDhopSiteDag(st,U,buf,sF,sU,in,out);
}
////////////////////////////////////////////
// Generic implementation; move to different file?
////////////////////////////////////////////
// One stencil leg of the generic kernel, expanded inside the function below.
//   Dir    : stencil direction used for both st.GetEntry and Impl::multLink
//   spProj : spin projector applied to the input site
//   Recon  : reconstruction routine that writes (spRecon*) or adds to
//            (accumRecon*) the full-spinor result
// If the stencil entry is local, the half spinor is projected from
// in._odata[SE->_offset] (and permuted with ptype when SE->_permute is set);
// otherwise it is read in place from buf[SE->_offset]
// (presumably the communication buffer - confirm against the stencil code).
#define GRID_WILSON_GENERIC_LEG(Dir,spProj,Recon)                 \
  do {                                                            \
    SE = st.GetEntry(ptype,Dir,sF);                               \
    if ( SE->_is_local ) {                                        \
      chi_p = &chi;                                               \
      if ( SE->_permute ) {                                       \
        spProj(tmp,in._odata[SE->_offset]);                       \
        permute(chi,tmp,ptype);                                   \
      } else {                                                    \
        spProj(chi,in._odata[SE->_offset]);                       \
      }                                                           \
    } else {                                                      \
      chi_p = &buf[SE->_offset];                                  \
    }                                                             \
    Impl::multLink(Uchi,U._odata[sU],*chi_p,Dir,SE,st);           \
    Recon(result,Uchi);                                           \
  } while (0)

// Generic (portable) single-site kernel for the "Dag" variant.
//   st     : stencil providing the per-direction entries for site sF
//   U      : doubled gauge field, read at index sU
//   buf    : half spinors used for non-local stencil entries
//   sF, sU : site indices into the fermion fields and the gauge field
//   in/out : input field and output field; out._odata[sF] is written once
// Each leg pairs projector X with stencil direction X (Xp with Xp, ...).
template<class Impl>
void WilsonKernels<Impl>::DiracOptGenericDhopSiteDag(StencilImpl &st,DoubledGaugeField &U,
                                                     std::vector<SiteHalfSpinor,alignedAllocator<SiteHalfSpinor> > &buf,
                                                     int sF,int sU,const FermionField &in, FermionField &out)
{
  SiteHalfSpinor  tmp;     // projected spinor before permutation
  SiteHalfSpinor  chi;     // projected (and possibly permuted) local spinor
  SiteHalfSpinor *chi_p;   // points at chi or directly into buf
  SiteHalfSpinor  Uchi;    // link times half spinor
  SiteSpinor      result;  // accumulated full spinor
  StencilEntry   *SE;
  int ptype;

  // The first leg initialises result (spRecon); the rest accumulate into it.
  GRID_WILSON_GENERIC_LEG(Xp,spProjXp,spReconXp);
  GRID_WILSON_GENERIC_LEG(Yp,spProjYp,accumReconYp);
  GRID_WILSON_GENERIC_LEG(Zp,spProjZp,accumReconZp);
  GRID_WILSON_GENERIC_LEG(Tp,spProjTp,accumReconTp);
  GRID_WILSON_GENERIC_LEG(Xm,spProjXm,accumReconXm);
  GRID_WILSON_GENERIC_LEG(Ym,spProjYm,accumReconYm);
  GRID_WILSON_GENERIC_LEG(Zm,spProjZm,accumReconZm);
  GRID_WILSON_GENERIC_LEG(Tm,spProjTm,accumReconTm);

  vstream(out._odata[sF],result);
}
#undef GRID_WILSON_GENERIC_LEG
// Need controls to do interior, exterior, or both
template<class Impl>
2016-06-03 11:24:26 +01:00
void WilsonKernels<Impl>::DiracOptGenericDhopSite(StencilImpl &st,DoubledGaugeField &U,
std::vector<SiteHalfSpinor,alignedAllocator<SiteHalfSpinor> > &buf,
int sF,int sU,const FermionField &in, FermionField &out)
{
SiteHalfSpinor tmp;
SiteHalfSpinor chi;
2016-03-27 05:24:07 +01:00
SiteHalfSpinor *chi_p;
SiteHalfSpinor Uchi;
2016-01-03 01:38:11 +00:00
SiteSpinor result;
StencilEntry *SE;
int ptype;
2016-01-03 01:38:11 +00:00
///////////////////////////
// Xp
2016-01-03 01:38:11 +00:00
///////////////////////////
SE=st.GetEntry(ptype,Xm,sF);
2016-01-03 01:38:11 +00:00
2016-03-27 05:24:07 +01:00
if ( SE->_is_local ) {
chi_p = &chi;
2016-01-03 01:38:11 +00:00
if ( SE->_permute ) {
spProjXp(tmp,in._odata[SE->_offset]);
permute(chi,tmp,ptype);
} else {
spProjXp(chi,in._odata[SE->_offset]);
}
2016-03-27 05:24:07 +01:00
} else {
chi_p=&buf[SE->_offset];
2016-01-03 01:38:11 +00:00
}
2016-03-27 05:24:07 +01:00
Impl::multLink(Uchi,U._odata[sU],*chi_p,Xm,SE,st);
spReconXp(result,Uchi);
2016-01-03 01:38:11 +00:00
///////////////////////////
// Yp
2016-01-03 01:38:11 +00:00
///////////////////////////
SE=st.GetEntry(ptype,Ym,sF);
2016-01-03 01:38:11 +00:00
2016-03-27 05:24:07 +01:00
if ( SE->_is_local ) {
chi_p = &chi;
2016-01-03 01:38:11 +00:00
if ( SE->_permute ) {
spProjYp(tmp,in._odata[SE->_offset]);
permute(chi,tmp,ptype);
} else {
spProjYp(chi,in._odata[SE->_offset]);
}
2016-03-27 05:24:07 +01:00
} else {
chi_p=&buf[SE->_offset];
2016-01-03 01:38:11 +00:00
}
2016-03-27 05:24:07 +01:00
Impl::multLink(Uchi,U._odata[sU],*chi_p,Ym,SE,st);
accumReconYp(result,Uchi);
2016-01-03 01:38:11 +00:00
///////////////////////////
// Zp
2016-01-03 01:38:11 +00:00
///////////////////////////
SE=st.GetEntry(ptype,Zm,sF);
2016-01-03 01:38:11 +00:00
2016-03-27 05:24:07 +01:00
if ( SE->_is_local ) {
chi_p = &chi;
2016-01-03 01:38:11 +00:00
if ( SE->_permute ) {
spProjZp(tmp,in._odata[SE->_offset]);
permute(chi,tmp,ptype);
} else {
spProjZp(chi,in._odata[SE->_offset]);
}
2016-03-27 05:24:07 +01:00
} else {
chi_p=&buf[SE->_offset];
2016-01-03 01:38:11 +00:00
}
2016-03-27 05:24:07 +01:00
Impl::multLink(Uchi,U._odata[sU],*chi_p,Zm,SE,st);
accumReconZp(result,Uchi);
2016-01-03 01:38:11 +00:00
///////////////////////////
// Tp
2016-01-03 01:38:11 +00:00
///////////////////////////
SE=st.GetEntry(ptype,Tm,sF);
2016-01-03 01:38:11 +00:00
2016-03-27 05:24:07 +01:00
if ( SE->_is_local ) {
chi_p = &chi;
2016-01-03 01:38:11 +00:00
if ( SE->_permute ) {
spProjTp(tmp,in._odata[SE->_offset]);
permute(chi,tmp,ptype);
} else {
spProjTp(chi,in._odata[SE->_offset]);
}
2016-03-27 05:24:07 +01:00
} else {
chi_p=&buf[SE->_offset];
2016-01-03 01:38:11 +00:00
}
2016-03-27 05:24:07 +01:00
Impl::multLink(Uchi,U._odata[sU],*chi_p,Tm,SE,st);
accumReconTp(result,Uchi);
2016-01-03 01:38:11 +00:00
///////////////////////////
// Xm
2016-01-03 01:38:11 +00:00
///////////////////////////
SE=st.GetEntry(ptype,Xp,sF);
2016-01-03 01:38:11 +00:00
2016-03-27 05:24:07 +01:00
if ( SE->_is_local ) {
chi_p = &chi;
2016-01-03 01:38:11 +00:00
if ( SE->_permute ) {
spProjXm(tmp,in._odata[SE->_offset]);
permute(chi,tmp,ptype);
} else {
spProjXm(chi,in._odata[SE->_offset]);
}
2016-03-27 05:24:07 +01:00
} else {
chi_p=&buf[SE->_offset];
2016-01-03 01:38:11 +00:00
}
2016-03-27 05:24:07 +01:00
Impl::multLink(Uchi,U._odata[sU],*chi_p,Xp,SE,st);
accumReconXm(result,Uchi);
2016-01-03 01:38:11 +00:00
///////////////////////////
// Ym
2016-01-03 01:38:11 +00:00
///////////////////////////
SE=st.GetEntry(ptype,Yp,sF);
2016-01-03 01:38:11 +00:00
2016-03-27 05:24:07 +01:00
if ( SE->_is_local ) {
chi_p = &chi;
2016-01-03 01:38:11 +00:00
if ( SE->_permute ) {
spProjYm(tmp,in._odata[SE->_offset]);
permute(chi,tmp,ptype);
} else {
spProjYm(chi,in._odata[SE->_offset]);
}
2016-03-27 05:24:07 +01:00
} else {
chi_p=&buf[SE->_offset];
2016-01-03 01:38:11 +00:00
}
2016-03-27 05:24:07 +01:00
Impl::multLink(Uchi,U._odata[sU],*chi_p,Yp,SE,st);
accumReconYm(result,Uchi);
2016-01-03 01:38:11 +00:00
///////////////////////////
// Zm
2016-01-03 01:38:11 +00:00
///////////////////////////
SE=st.GetEntry(ptype,Zp,sF);
2016-01-03 01:38:11 +00:00
2016-03-27 05:24:07 +01:00
if ( SE->_is_local ) {
chi_p = &chi;
2016-01-03 01:38:11 +00:00
if ( SE->_permute ) {
spProjZm(tmp,in._odata[SE->_offset]);
permute(chi,tmp,ptype);
} else {
spProjZm(chi,in._odata[SE->_offset]);
}
2016-03-27 05:24:07 +01:00
} else {
chi_p=&buf[SE->_offset];
2016-01-03 01:38:11 +00:00
}
2016-03-27 05:24:07 +01:00
Impl::multLink(Uchi,U._odata[sU],*chi_p,Zp,SE,st);
accumReconZm(result,Uchi);
2016-01-03 01:38:11 +00:00
///////////////////////////
// Tm
2016-01-03 01:38:11 +00:00
///////////////////////////
SE=st.GetEntry(ptype,Tp,sF);
2016-01-03 01:38:11 +00:00
2016-03-27 05:24:07 +01:00
if ( SE->_is_local ) {
chi_p = &chi;
2016-01-03 01:38:11 +00:00
if ( SE->_permute ) {
spProjTm(tmp,in._odata[SE->_offset]);
permute(chi,tmp,ptype);
} else {
spProjTm(chi,in._odata[SE->_offset]);
}
2016-03-27 05:24:07 +01:00
} else {
chi_p=&buf[SE->_offset];
2016-01-03 01:38:11 +00:00
}
2016-03-27 05:24:07 +01:00
Impl::multLink(Uchi,U._odata[sU],*chi_p,Tp,SE,st);
accumReconTm(result,Uchi);
2016-01-03 01:38:11 +00:00
2016-03-27 05:24:07 +01:00
vstream(out._odata[sF],result);
2016-01-03 01:38:11 +00:00
};
// One candidate projector for DiracOptDhopDir, expanded inside the function
// below. Runs only when the caller's `gamma` equals Which.
//   Which  : projector identifier compared against gamma
//   spProj : spin projector applied to the input site
//   Recon  : reconstruction routine that writes the full-spinor result
// For a local stencil entry the half spinor is projected from
// in._odata[SE->_offset] (and permuted with ptype when SE->_permute is set);
// otherwise buf[SE->_offset] is passed to multLink in place, as the generic
// site kernels in this file do, instead of being copied into chi first.
#define GRID_WILSON_DHOPDIR_LEG(Which,spProj,Recon)               \
  do {                                                            \
    if ( gamma == Which ) {                                       \
      if ( SE->_is_local ) {                                      \
        chi_p = &chi;                                             \
        if ( SE->_permute ) {                                     \
          spProj(tmp,in._odata[SE->_offset]);                     \
          permute(chi,tmp,ptype);                                 \
        } else {                                                  \
          spProj(chi,in._odata[SE->_offset]);                     \
        }                                                         \
      } else {                                                    \
        chi_p = &buf[SE->_offset];                                \
      }                                                           \
      Impl::multLink(Uchi,U._odata[sU],*chi_p,dir,SE,st);         \
      Recon(result,Uchi);                                         \
    }                                                             \
  } while (0)

// Single-direction hopping term at one site.
//   st     : stencil; the entry for direction `dir` at site sF is used
//   U      : doubled gauge field, read at index sU
//   buf    : half spinors used when the stencil entry is not local
//   sF, sU : site indices into the fermion fields and the gauge field
//   in/out : input field and output field; out._odata[sF] is written once
//   dir    : stencil direction, also passed to Impl::multLink
//   gamma  : selects the spin projector / reconstruction pair (Xp ... Tm)
// NOTE(review): if gamma equals none of Xp..Tm, `result` is never assigned
// before being streamed to `out`; callers appear to be expected to pass one
// of the eight identifiers - confirm.
template<class Impl>
void WilsonKernels<Impl>::DiracOptDhopDir(StencilImpl &st,DoubledGaugeField &U,
                                          std::vector<SiteHalfSpinor,alignedAllocator<SiteHalfSpinor> > &buf,
                                          int sF,int sU,const FermionField &in, FermionField &out,int dir,int gamma)
{
  SiteHalfSpinor  tmp;     // projected spinor before permutation
  SiteHalfSpinor  chi;     // projected (and possibly permuted) local spinor
  SiteHalfSpinor *chi_p;   // points at chi or directly into buf
  SiteSpinor      result;
  SiteHalfSpinor  Uchi;    // link times half spinor
  StencilEntry   *SE;
  int ptype;

  // The stencil entry depends only on dir, so it is fetched once.
  SE = st.GetEntry(ptype,dir,sF);

  GRID_WILSON_DHOPDIR_LEG(Xp,spProjXp,spReconXp);
  GRID_WILSON_DHOPDIR_LEG(Yp,spProjYp,spReconYp);
  GRID_WILSON_DHOPDIR_LEG(Zp,spProjZp,spReconZp);
  GRID_WILSON_DHOPDIR_LEG(Tp,spProjTp,spReconTp);
  GRID_WILSON_DHOPDIR_LEG(Xm,spProjXm,spReconXm);
  GRID_WILSON_DHOPDIR_LEG(Ym,spProjYm,spReconYm);
  GRID_WILSON_DHOPDIR_LEG(Zm,spProjZm,spReconZm);
  GRID_WILSON_DHOPDIR_LEG(Tm,spProjTm,spReconTm);

  vstream(out._odata[sF],result);
}
#undef GRID_WILSON_DHOPDIR_LEG
FermOpTemplateInstantiate(WilsonKernels);
2016-06-03 11:24:26 +01:00
2016-04-19 23:38:01 +01:00
template class WilsonKernels<DomainWallRedBlack5dImplF>;
template class WilsonKernels<DomainWallRedBlack5dImplD>;
}}