2016-07-18 16:36:28 +01:00
|
|
|
/*************************************************************************************
|
2016-01-02 14:51:32 +00:00
|
|
|
|
2016-07-18 16:36:28 +01:00
|
|
|
Grid physics library, www.github.com/paboyle/Grid
|
2016-01-02 14:51:32 +00:00
|
|
|
|
2016-07-18 16:36:28 +01:00
|
|
|
Source file: ./lib/qcd/action/fermion/WilsonKernels.h
|
2016-01-02 14:51:32 +00:00
|
|
|
|
2016-07-18 16:36:28 +01:00
|
|
|
Copyright (C) 2015
|
2016-01-02 14:51:32 +00:00
|
|
|
|
|
|
|
Author: Peter Boyle <pabobyle@ph.ed.ac.uk>
|
|
|
|
Author: Peter Boyle <paboyle@ph.ed.ac.uk>
|
|
|
|
Author: paboyle <paboyle@ph.ed.ac.uk>
|
|
|
|
|
2016-07-18 16:36:28 +01:00
|
|
|
This program is free software; you can redistribute it and/or modify
|
|
|
|
it under the terms of the GNU General Public License as published by
|
|
|
|
the Free Software Foundation; either version 2 of the License, or
|
|
|
|
(at your option) any later version.
|
2016-01-02 14:51:32 +00:00
|
|
|
|
2016-07-18 16:36:28 +01:00
|
|
|
This program is distributed in the hope that it will be useful,
|
|
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
GNU General Public License for more details.
|
2016-01-02 14:51:32 +00:00
|
|
|
|
2016-07-18 16:36:28 +01:00
|
|
|
You should have received a copy of the GNU General Public License along
|
|
|
|
with this program; if not, write to the Free Software Foundation, Inc.,
|
|
|
|
51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
|
2016-01-02 14:51:32 +00:00
|
|
|
|
2016-07-18 16:36:28 +01:00
|
|
|
See the full license in the file "LICENSE" in the top level distribution
|
|
|
|
directory
|
|
|
|
*************************************************************************************/
|
|
|
|
/* END LEGAL */
|
|
|
|
#ifndef GRID_QCD_DHOP_H
|
|
|
|
#define GRID_QCD_DHOP_H
|
2015-05-31 15:09:02 +01:00
|
|
|
|
|
|
|
namespace Grid {
|
|
|
|
|
|
|
|
namespace QCD {
|
|
|
|
|
|
|
|
////////////////////////////////////////////////////////////////////////////////////////////////////////////////
|
2015-08-10 20:47:44 +01:00
|
|
|
// Helper routines that implement Wilson stencil for a single site.
|
2015-08-15 23:25:49 +01:00
|
|
|
// Common to both the WilsonFermion and WilsonFermion5D
|
2015-05-31 15:09:02 +01:00
|
|
|
////////////////////////////////////////////////////////////////////////////////////////////////////////////////
|
2016-06-03 11:24:26 +01:00
|
|
|
// Non-template holder for the kernel-selection switches, so that every
// WilsonKernels<Impl> instantiation shares one pair of flags.
class WilsonKernelsStatic {
 public:
  // S-direction is INNERMOST and takes no part in the parity.

  // Temporary hack: when non-zero (and AVX512 is defined) the site sweeps in
  // this header are handed to the assembler kernels.
  static int AsmOpt;

  // Temporary hack: when non-zero the hand-optimised per-site kernels are
  // used in place of the generic ones.
  static int HandOpt;
};
|
2015-08-10 20:47:44 +01:00
|
|
|
|
2016-06-03 11:24:26 +01:00
|
|
|
// Wilson hopping-term kernels for one fermion implementation policy `Impl`.
//
// The public DiracOptDhopSite / DiracOptDhopSiteDag entry points sweep `Ns`
// consecutive sites, each carrying `Ls` consecutive s-slices, and forward
// every (sF, sU) pair to one of the private per-site kernels.  `sF` advances
// once per (site, s) pair and `sU` once per site.
//
// Each entry point comes as a pair of SFINAE-selected overloads:
//   * Impl::Dimension == 3 and Nc == 3 : may use the assembler kernels
//     (only when AVX512 is defined and AsmOpt is set) or the hand-optimised
//     kernels (when HandOpt is set), otherwise the generic kernels;
//   * every other case                 : always the generic kernels.
// The defaulted `EnableBool` template parameter exists only to make the
// enable_if condition dependent on a function template parameter.
template <class Impl>
class WilsonKernels : public FermionOperator<Impl>, public WilsonKernelsStatic {
 public:
  INHERIT_IMPL_TYPES(Impl);
  using Base = FermionOperator<Impl>;

  WilsonKernels(const ImplParams &p = ImplParams());

  // Site sweep, optimised overload (Impl::Dimension == 3 and Nc == 3).
  template <bool EnableBool = true>
  typename std::enable_if<Impl::Dimension == 3 && Nc == 3 && EnableBool,
                          void>::type
  DiracOptDhopSite(
      StencilImpl &st, LebesgueOrder &lo, DoubledGaugeField &U,
      std::vector<SiteHalfSpinor, alignedAllocator<SiteHalfSpinor> > &buf,
      int sF, int sU, int Ls, int Ns, const FermionField &in,
      FermionField &out) {
#ifdef AVX512
    // The assembler kernel consumes the whole (Ns, Ls) range in one call.
    if (AsmOpt) {
      WilsonKernels<Impl>::DiracOptAsmDhopSite(st, lo, U, buf, sF, sU, Ls, Ns,
                                               in, out);
      return;
    }
#endif
    for (int n = 0; n < Ns; ++n, ++sU) {
      for (int slice = 0; slice < Ls; ++slice, ++sF) {
        // HandOpt is re-read for every call, exactly as a plain global flag.
        if (HandOpt) {
          WilsonKernels<Impl>::DiracOptHandDhopSite(st, lo, U, buf, sF, sU,
                                                    in, out);
        } else {
          WilsonKernels<Impl>::DiracOptGenericDhopSite(st, lo, U, buf, sF, sU,
                                                       in, out);
        }
      }
    }
  }

  // Site sweep, fallback overload (Impl::Dimension != 3 or Nc != 3):
  // only the generic per-site kernel is available.
  template <bool EnableBool = true>
  typename std::enable_if<(Impl::Dimension != 3 || Nc != 3) && EnableBool,
                          void>::type
  DiracOptDhopSite(
      StencilImpl &st, LebesgueOrder &lo, DoubledGaugeField &U,
      std::vector<SiteHalfSpinor, alignedAllocator<SiteHalfSpinor> > &buf,
      int sF, int sU, int Ls, int Ns, const FermionField &in,
      FermionField &out) {
    for (int n = 0; n < Ns; ++n, ++sU) {
      for (int slice = 0; slice < Ls; ++slice, ++sF) {
        WilsonKernels<Impl>::DiracOptGenericDhopSite(st, lo, U, buf, sF, sU,
                                                     in, out);
      }
    }
  }

  // "Dag" site sweep, optimised overload (Impl::Dimension == 3 and Nc == 3).
  // Mirrors DiracOptDhopSite but dispatches to the *Dag kernels.
  template <bool EnableBool = true>
  typename std::enable_if<Impl::Dimension == 3 && Nc == 3 && EnableBool,
                          void>::type
  DiracOptDhopSiteDag(
      StencilImpl &st, LebesgueOrder &lo, DoubledGaugeField &U,
      std::vector<SiteHalfSpinor, alignedAllocator<SiteHalfSpinor> > &buf,
      int sF, int sU, int Ls, int Ns, const FermionField &in,
      FermionField &out) {
#ifdef AVX512
    // The assembler kernel consumes the whole (Ns, Ls) range in one call.
    if (AsmOpt) {
      WilsonKernels<Impl>::DiracOptAsmDhopSiteDag(st, lo, U, buf, sF, sU, Ls,
                                                  Ns, in, out);
      return;
    }
#endif
    for (int n = 0; n < Ns; ++n, ++sU) {
      for (int slice = 0; slice < Ls; ++slice, ++sF) {
        if (HandOpt) {
          WilsonKernels<Impl>::DiracOptHandDhopSiteDag(st, lo, U, buf, sF, sU,
                                                       in, out);
        } else {
          WilsonKernels<Impl>::DiracOptGenericDhopSiteDag(st, lo, U, buf, sF,
                                                          sU, in, out);
        }
      }
    }
  }

  // "Dag" site sweep, fallback overload (Impl::Dimension != 3 or Nc != 3):
  // only the generic per-site kernel is available.
  template <bool EnableBool = true>
  typename std::enable_if<(Impl::Dimension != 3 || Nc != 3) && EnableBool,
                          void>::type
  DiracOptDhopSiteDag(
      StencilImpl &st, LebesgueOrder &lo, DoubledGaugeField &U,
      std::vector<SiteHalfSpinor, alignedAllocator<SiteHalfSpinor> > &buf,
      int sF, int sU, int Ls, int Ns, const FermionField &in,
      FermionField &out) {
    for (int n = 0; n < Ns; ++n, ++sU) {
      for (int slice = 0; slice < Ls; ++slice, ++sF) {
        WilsonKernels<Impl>::DiracOptGenericDhopSiteDag(st, lo, U, buf, sF, sU,
                                                        in, out);
      }
    }
  }

  // Declared here, defined elsewhere.
  // NOTE(review): presumably applies the single hopping term selected by
  // `dirdisp` with spin structure `gamma` -- confirm against the definition.
  void DiracOptDhopDir(
      StencilImpl &st, DoubledGaugeField &U,
      std::vector<SiteHalfSpinor, alignedAllocator<SiteHalfSpinor> > &buf,
      int sF, int sU, const FermionField &in, FermionField &out, int dirdisp,
      int gamma);

 private:
  // Specialised variants.  The Generic and Hand kernels handle one (sF, sU)
  // pair per call; the Asm kernels receive Ls and Ns and cover the full range.

  void DiracOptGenericDhopSite(
      StencilImpl &st, LebesgueOrder &lo, DoubledGaugeField &U,
      std::vector<SiteHalfSpinor, alignedAllocator<SiteHalfSpinor> > &buf,
      int sF, int sU, const FermionField &in, FermionField &out);

  void DiracOptGenericDhopSiteDag(
      StencilImpl &st, LebesgueOrder &lo, DoubledGaugeField &U,
      std::vector<SiteHalfSpinor, alignedAllocator<SiteHalfSpinor> > &buf,
      int sF, int sU, const FermionField &in, FermionField &out);

  void DiracOptAsmDhopSite(
      StencilImpl &st, LebesgueOrder &lo, DoubledGaugeField &U,
      std::vector<SiteHalfSpinor, alignedAllocator<SiteHalfSpinor> > &buf,
      int sF, int sU, int Ls, int Ns, const FermionField &in,
      FermionField &out);

  void DiracOptAsmDhopSiteDag(
      StencilImpl &st, LebesgueOrder &lo, DoubledGaugeField &U,
      std::vector<SiteHalfSpinor, alignedAllocator<SiteHalfSpinor> > &buf,
      int sF, int sU, int Ls, int Ns, const FermionField &in,
      FermionField &out);

  void DiracOptHandDhopSite(
      StencilImpl &st, LebesgueOrder &lo, DoubledGaugeField &U,
      std::vector<SiteHalfSpinor, alignedAllocator<SiteHalfSpinor> > &buf,
      int sF, int sU, const FermionField &in, FermionField &out);

  void DiracOptHandDhopSiteDag(
      StencilImpl &st, LebesgueOrder &lo, DoubledGaugeField &U,
      std::vector<SiteHalfSpinor, alignedAllocator<SiteHalfSpinor> > &buf,
      int sF, int sU, const FermionField &in, FermionField &out);
};
|
2016-09-09 10:53:22 +01:00
|
|
|
|
2016-09-13 10:01:51 +01:00
|
|
|
///////////////////////////////////////////////////////////
|
|
|
|
// Default to no assembler implementation
|
|
|
|
///////////////////////////////////////////////////////////
|
|
|
|
template<class Impl>
|
|
|
|
void WilsonKernels<Impl >::DiracOptAsmDhopSite(StencilImpl &st,LebesgueOrder & lo,DoubledGaugeField &U,
|
|
|
|
std::vector<SiteHalfSpinor,alignedAllocator<SiteHalfSpinor> > &buf,
|
|
|
|
int ss,int ssU,int Ls,int Ns,const FermionField &in, FermionField &out)
|
|
|
|
{
|
|
|
|
assert(0);
|
|
|
|
}
|
|
|
|
template<class Impl>
|
|
|
|
void WilsonKernels<Impl >::DiracOptAsmDhopSiteDag(StencilImpl &st,LebesgueOrder & lo,DoubledGaugeField &U,
|
|
|
|
std::vector<SiteHalfSpinor,alignedAllocator<SiteHalfSpinor> > &buf,
|
|
|
|
int ss,int ssU,int Ls,int Ns,const FermionField &in, FermionField &out)
|
|
|
|
{
|
|
|
|
assert(0);
|
|
|
|
}
|
|
|
|
|
2016-07-18 16:36:28 +01:00
|
|
|
}
|
|
|
|
}
|
2015-05-31 15:09:02 +01:00
|
|
|
#endif
|