mirror of
https://github.com/paboyle/Grid.git
synced 2024-11-10 07:55:35 +00:00
Faster implementation of conserved current site contraction. Added 5D vectorised support, but not G-parity.
This commit is contained in:
parent
2d433ba307
commit
5633a2db20
@ -212,6 +212,13 @@ namespace QCD {
|
||||
StencilImpl &St) {
|
||||
mult(&phi(), &U(mu), &chi());
|
||||
}
|
||||
|
||||
inline void multLinkProp(SitePropagator &phi,
|
||||
const SiteDoubledGaugeField &U,
|
||||
const SitePropagator &chi,
|
||||
int mu) {
|
||||
mult(&phi(), &U(mu), &chi());
|
||||
}
|
||||
|
||||
template <class ref>
|
||||
inline void loadLinkElement(Simd ®, ref &memory) {
|
||||
@ -340,7 +347,20 @@ class DomainWallVec5dImpl : public PeriodicGaugeImpl< GaugeImplTypes< S,Nrepres
|
||||
}
|
||||
mult(&phi(), &UU(), &chi());
|
||||
}
|
||||
|
||||
|
||||
inline void multLinkProp(SitePropagator &phi,
|
||||
const SiteDoubledGaugeField &U,
|
||||
const SitePropagator &chi,
|
||||
int mu) {
|
||||
SiteGaugeLink UU;
|
||||
for (int i = 0; i < Nrepresentation; i++) {
|
||||
for (int j = 0; j < Nrepresentation; j++) {
|
||||
vsplat(UU()()(i, j), U(mu)()(i, j));
|
||||
}
|
||||
}
|
||||
mult(&phi(), &UU(), &chi());
|
||||
}
|
||||
|
||||
inline void DoubleStore(GridBase *GaugeGrid, DoubledGaugeField &Uds,const GaugeField &Umu)
|
||||
{
|
||||
SiteScalarGaugeField ScalarUmu;
|
||||
@ -538,6 +558,13 @@ class GparityWilsonImpl : public ConjugateGaugeImpl<GaugeImplTypes<S, Nrepresent
|
||||
|
||||
}
|
||||
|
||||
// Fixme: Gparity prop * link
|
||||
inline void multLinkProp(SitePropagator &phi, const SiteDoubledGaugeField &U,
|
||||
const SitePropagator &chi, int mu)
|
||||
{
|
||||
assert(0);
|
||||
}
|
||||
|
||||
inline void DoubleStore(GridBase *GaugeGrid,DoubledGaugeField &Uds,const GaugeField &Umu)
|
||||
{
|
||||
conformable(Uds._grid,GaugeGrid);
|
||||
|
@ -361,8 +361,24 @@ void WilsonFermion<Impl>::ContractConservedCurrent(PropagatorField &q_in_1,
|
||||
conformable(_grid, q_in_1._grid);
|
||||
conformable(_grid, q_in_2._grid);
|
||||
conformable(_grid, q_out._grid);
|
||||
Kernels::ContractConservedCurrentInternal(q_in_1, q_in_2, q_out,
|
||||
Umu, curr_type, mu);
|
||||
PropagatorField tmp(_grid);
|
||||
q_out = zero;
|
||||
|
||||
// Forward, need q1(x + mu), q2(x)
|
||||
tmp = Cshift(q_in_1, mu, 1);
|
||||
parallel_for (unsigned int sU = 0; sU < Umu._grid->oSites(); ++sU)
|
||||
{
|
||||
Kernels::ContractConservedCurrentSiteFwd(tmp, q_in_2, q_out, Umu,
|
||||
mu, sU, sU, sU, sU);
|
||||
}
|
||||
|
||||
// Backward, need q1(x), q2(x + mu)
|
||||
tmp = Cshift(q_in_2, mu, 1);
|
||||
parallel_for (unsigned int sU = 0; sU < Umu._grid->oSites(); ++sU)
|
||||
{
|
||||
Kernels::ContractConservedCurrentSiteBwd(q_in_1, tmp, q_out, Umu,
|
||||
mu, sU, sU, sU, sU);
|
||||
}
|
||||
}
|
||||
|
||||
template <class Impl>
|
||||
|
@ -687,26 +687,44 @@ void WilsonFermion5D<Impl>::ContractConservedCurrent(PropagatorField &q_in_1,
|
||||
conformable(q_in_1._grid, q_in_2._grid);
|
||||
conformable(_FourDimGrid, q_out._grid);
|
||||
|
||||
PropagatorField q1_s(_FourDimGrid);
|
||||
PropagatorField q2_s(_FourDimGrid);
|
||||
PropagatorField tmp(_FourDimGrid);
|
||||
|
||||
// Contract across 5th dimension.
|
||||
PropagatorField tmp(FermionGrid());
|
||||
q_out = zero;
|
||||
for (int s = 0; s < Ls; ++s)
|
||||
{
|
||||
ExtractSlice(q1_s, q_in_1, s, 0);
|
||||
ExtractSlice(q2_s, q_in_2, Ls - s - 1, 0);
|
||||
Kernels::ContractConservedCurrentInternal(q1_s, q2_s, tmp, Umu, curr_type, mu);
|
||||
|
||||
// Axial current sign
|
||||
if ((curr_type == Current::Axial) && (s < (Ls / 2)))
|
||||
// Forward, need q1(x + mu, s), q2(x, Ls - 1 - s). 5D lattice so shift
|
||||
// 4D coordinate mu by one.
|
||||
tmp = Cshift(q_in_1, mu + 1, 1);
|
||||
parallel_for (unsigned int sU = 0; sU < Umu._grid->oSites(); ++sU)
|
||||
{
|
||||
unsigned int sF1 = sU * Ls;
|
||||
unsigned int sF2 = (sU + 1) * Ls - 1;
|
||||
for (int s = 0; s < Ls; ++s)
|
||||
{
|
||||
q_out -= tmp;
|
||||
bool axial_sign = ((curr_type == Current::Axial) && (s < (Ls / 2))) ? \
|
||||
true : false;
|
||||
Kernels::ContractConservedCurrentSiteFwd(tmp, q_in_2, q_out, Umu,
|
||||
mu, sF1, sF2, sU, sU,
|
||||
axial_sign);
|
||||
sF1++;
|
||||
sF2--;
|
||||
}
|
||||
else
|
||||
}
|
||||
|
||||
// Backward, need q1(x, s), q2(x + mu, Ls - 1 - s). 5D lattice so shift
|
||||
// 4D coordinate mu by one.
|
||||
tmp = Cshift(q_in_2, mu + 1, 1);
|
||||
parallel_for (unsigned int sU = 0; sU < Umu._grid->oSites(); ++sU)
|
||||
{
|
||||
unsigned int sF1 = sU * Ls;
|
||||
unsigned int sF2 = (sU + 1) * Ls - 1;
|
||||
for (int s = 0; s < Ls; ++s)
|
||||
{
|
||||
q_out += tmp;
|
||||
bool axial_sign = ((curr_type == Current::Axial) && (s < (Ls / 2))) ? \
|
||||
true : false;
|
||||
Kernels::ContractConservedCurrentSiteBwd(q_in_1, tmp, q_out, Umu,
|
||||
mu, sF1, sF2, sU, sU,
|
||||
axial_sign);
|
||||
sF1++;
|
||||
sF2--;
|
||||
}
|
||||
}
|
||||
}
|
||||
|
@ -290,26 +290,110 @@ void WilsonKernels<Impl>::DhopDir( StencilImpl &st, DoubledGaugeField &U,SiteHal
|
||||
#define WilsonCurrentFwd(expr, mu) ((expr - Gamma::gmu[mu]*expr))
|
||||
#define WilsonCurrentBwd(expr, mu) ((expr + Gamma::gmu[mu]*expr))
|
||||
|
||||
/*******************************************************************************
|
||||
* Name: ContractConservedCurrentSiteFwd
|
||||
* Operation: (1/2) * q2[x] * U(x) * (g[mu] - 1) * q1[x + mu]
|
||||
* Notes: - DoubledGaugeField U assumed to contain -1/2 factor.
|
||||
* - Pass in q_in_1 shifted in +ve mu direction.
|
||||
******************************************************************************/
|
||||
template<class Impl>
|
||||
void WilsonKernels<Impl>::ContractConservedCurrentInternal(const PropagatorField &q_in_1,
|
||||
const PropagatorField &q_in_2,
|
||||
PropagatorField &q_out,
|
||||
DoubledGaugeField &U,
|
||||
Current curr_type,
|
||||
unsigned int mu)
|
||||
void WilsonKernels<Impl>::ContractConservedCurrentSiteFwd(
|
||||
const PropagatorField &q_in_1,
|
||||
const PropagatorField &q_in_2,
|
||||
PropagatorField &q_out,
|
||||
DoubledGaugeField &U,
|
||||
unsigned int mu,
|
||||
unsigned int sF_in_1,
|
||||
unsigned int sF_in_2,
|
||||
unsigned int sF_out,
|
||||
unsigned int sU,
|
||||
bool switch_sign)
|
||||
{
|
||||
SitePropagator result, tmp;
|
||||
Gamma g5(Gamma::Algebra::Gamma5);
|
||||
PropagatorField tmp(q_out._grid);
|
||||
GaugeLinkField Umu(U._grid);
|
||||
Umu = PeekIndex<LorentzIndex>(U, mu);
|
||||
|
||||
tmp = this->CovShiftForward(Umu, mu, q_in_1);
|
||||
q_out = (g5*adj(q_in_2)*g5)*WilsonCurrentFwd(tmp, mu);
|
||||
|
||||
tmp = this->CovShiftForward(Umu, mu, q_in_2);
|
||||
q_out -= (g5*adj(tmp)*g5)*WilsonCurrentBwd(q_in_1, mu);
|
||||
multLinkProp(tmp, U._odata[sU], q_in_1._odata[sF_in_1], mu);
|
||||
result = g5 * adj(q_in_2._odata[sF_in_2]) * g5 * WilsonCurrentFwd(tmp, mu);
|
||||
if (switch_sign)
|
||||
{
|
||||
q_out._odata[sF_out] -= result;
|
||||
}
|
||||
else
|
||||
{
|
||||
q_out._odata[sF_out] += result;
|
||||
}
|
||||
}
|
||||
|
||||
/*******************************************************************************
|
||||
* Name: ContractConservedCurrentSiteBwd
|
||||
* Operation: (1/2) * q2[x + mu] * U^dag(x) * (g[mu] + 1) * q1[x]
|
||||
* Notes: - DoubledGaugeField U assumed to contain -1/2 factor.
|
||||
* - Pass in q_in_2 shifted in +ve mu direction.
|
||||
******************************************************************************/
|
||||
template<class Impl>
|
||||
void WilsonKernels<Impl>::ContractConservedCurrentSiteBwd(
|
||||
const PropagatorField &q_in_1,
|
||||
const PropagatorField &q_in_2,
|
||||
PropagatorField &q_out,
|
||||
DoubledGaugeField &U,
|
||||
unsigned int mu,
|
||||
unsigned int sF_in_1,
|
||||
unsigned int sF_in_2,
|
||||
unsigned int sF_out,
|
||||
unsigned int sU,
|
||||
bool switch_sign)
|
||||
{
|
||||
SitePropagator result, tmp;
|
||||
Gamma g5(Gamma::Algebra::Gamma5);
|
||||
multLinkProp(tmp, U._odata[sU], q_in_1._odata[sF_in_1], mu + Nd);
|
||||
result = g5 * adj(q_in_2._odata[sF_in_2]) * g5 * WilsonCurrentBwd(tmp, mu);
|
||||
if (switch_sign)
|
||||
{
|
||||
q_out._odata[sF_out] += result;
|
||||
}
|
||||
else
|
||||
{
|
||||
q_out._odata[sF_out] -= result;
|
||||
}
|
||||
}
|
||||
|
||||
// G-parity requires more specialised implementation.
|
||||
#define NO_CURR_SITE(Impl) \
|
||||
template <> \
|
||||
void WilsonKernels<Impl>::ContractConservedCurrentSiteFwd( \
|
||||
const PropagatorField &q_in_1, \
|
||||
const PropagatorField &q_in_2, \
|
||||
PropagatorField &q_out, \
|
||||
DoubledGaugeField &U, \
|
||||
unsigned int mu, \
|
||||
unsigned int sF_in_1, \
|
||||
unsigned int sF_in_2, \
|
||||
unsigned int sF_out, \
|
||||
unsigned int sU, \
|
||||
bool switch_sign) \
|
||||
{ \
|
||||
assert(0); \
|
||||
} \
|
||||
template <> \
|
||||
void WilsonKernels<Impl>::ContractConservedCurrentSiteBwd( \
|
||||
const PropagatorField &q_in_1, \
|
||||
const PropagatorField &q_in_2, \
|
||||
PropagatorField &q_out, \
|
||||
DoubledGaugeField &U, \
|
||||
unsigned int mu, \
|
||||
unsigned int sF_in_1, \
|
||||
unsigned int sF_in_2, \
|
||||
unsigned int sF_out, \
|
||||
unsigned int sU, \
|
||||
bool switch_sign) \
|
||||
{ \
|
||||
assert(0); \
|
||||
}
|
||||
|
||||
NO_CURR_SITE(GparityWilsonImplF);
|
||||
NO_CURR_SITE(GparityWilsonImplD);
|
||||
NO_CURR_SITE(GparityWilsonImplFH);
|
||||
NO_CURR_SITE(GparityWilsonImplDF);
|
||||
|
||||
|
||||
template <class Impl>
|
||||
void WilsonKernels<Impl>::SeqConservedCurrentInternal(const PropagatorField &q_in,
|
||||
@ -342,16 +426,6 @@ void WilsonKernels<Impl>::SeqConservedCurrentInternal(const PropagatorField &q_i
|
||||
|
||||
// GParity, (Z)DomainWallVec5D -> require special implementation
|
||||
#define NO_CURR(Impl) \
|
||||
template <> void \
|
||||
WilsonKernels<Impl>::ContractConservedCurrentInternal(const PropagatorField &q_in_1, \
|
||||
const PropagatorField &q_in_2, \
|
||||
PropagatorField &q_out, \
|
||||
DoubledGaugeField &U, \
|
||||
Current curr_type, \
|
||||
unsigned int mu) \
|
||||
{ \
|
||||
assert(0); \
|
||||
} \
|
||||
template <> void \
|
||||
WilsonKernels<Impl>::SeqConservedCurrentInternal(const PropagatorField &q_in, \
|
||||
PropagatorField &q_out, \
|
||||
|
@ -183,12 +183,26 @@ public:
|
||||
//////////////////////////////////////////////////////////////////////////////
|
||||
// Utilities for inserting Wilson conserved current.
|
||||
//////////////////////////////////////////////////////////////////////////////
|
||||
void ContractConservedCurrentInternal(const PropagatorField &q_in_1,
|
||||
const PropagatorField &q_in_2,
|
||||
PropagatorField &q_out,
|
||||
DoubledGaugeField &U,
|
||||
Current curr_type,
|
||||
unsigned int mu);
|
||||
void ContractConservedCurrentSiteFwd(const PropagatorField &q_in_1,
|
||||
const PropagatorField &q_in_2,
|
||||
PropagatorField &q_out,
|
||||
DoubledGaugeField &U,
|
||||
unsigned int mu,
|
||||
unsigned int sF_in_1,
|
||||
unsigned int sF_in_2,
|
||||
unsigned int sF_out,
|
||||
unsigned int sU,
|
||||
bool switch_sign = false);
|
||||
void ContractConservedCurrentSiteBwd(const PropagatorField &q_in_1,
|
||||
const PropagatorField &q_in_2,
|
||||
PropagatorField &q_out,
|
||||
DoubledGaugeField &U,
|
||||
unsigned int mu,
|
||||
unsigned int sF_in_1,
|
||||
unsigned int sF_in_2,
|
||||
unsigned int sF_out,
|
||||
unsigned int sU,
|
||||
bool switch_sign = false);
|
||||
void SeqConservedCurrentInternal(const PropagatorField &q_in,
|
||||
PropagatorField &q_out,
|
||||
DoubledGaugeField &U,
|
||||
|
Loading…
Reference in New Issue
Block a user