From 1b6b12589f7634ce1eecda5b3b5ce0a20897dfce Mon Sep 17 00:00:00 2001 From: Daniel Richtmann Date: Tue, 1 Feb 2022 22:41:01 +0100 Subject: [PATCH] Get splitting up into implementation and instantiation files correct --- .../fermion/CompactWilsonCloverFermion.h | 296 +------------- Grid/qcd/action/fermion/Fermion.h | 18 + ...CompactWilsonCloverFermionImplementation.h | 363 ++++++++++++++++++ ...WilsonCloverFermionInstantiation.cc.master | 41 ++ ...rFermionInstantiationGparityWilsonImplD.cc | 1 + ...rFermionInstantiationGparityWilsonImplF.cc | 1 + ...loverFermionInstantiationWilsonAdjImplD.cc | 1 + ...loverFermionInstantiationWilsonAdjImplF.cc | 1 + ...onCloverFermionInstantiationWilsonImplD.cc | 1 + ...onCloverFermionInstantiationWilsonImplF.cc | 1 + ...tiationWilsonTwoIndexAntiSymmetricImplD.cc | 1 + ...tiationWilsonTwoIndexAntiSymmetricImplF.cc | 1 + ...stantiationWilsonTwoIndexSymmetricImplD.cc | 1 + ...stantiationWilsonTwoIndexSymmetricImplF.cc | 1 + .../instantiation/generate_instantiations.sh | 2 +- 15 files changed, 454 insertions(+), 276 deletions(-) create mode 100644 Grid/qcd/action/fermion/implementation/CompactWilsonCloverFermionImplementation.h create mode 100644 Grid/qcd/action/fermion/instantiation/CompactWilsonCloverFermionInstantiation.cc.master create mode 120000 Grid/qcd/action/fermion/instantiation/GparityWilsonImplD/CompactWilsonCloverFermionInstantiationGparityWilsonImplD.cc create mode 120000 Grid/qcd/action/fermion/instantiation/GparityWilsonImplF/CompactWilsonCloverFermionInstantiationGparityWilsonImplF.cc create mode 120000 Grid/qcd/action/fermion/instantiation/WilsonAdjImplD/CompactWilsonCloverFermionInstantiationWilsonAdjImplD.cc create mode 120000 Grid/qcd/action/fermion/instantiation/WilsonAdjImplF/CompactWilsonCloverFermionInstantiationWilsonAdjImplF.cc create mode 120000 Grid/qcd/action/fermion/instantiation/WilsonImplD/CompactWilsonCloverFermionInstantiationWilsonImplD.cc create mode 120000 Grid/qcd/action/fermion/instantiation/WilsonImplF/CompactWilsonCloverFermionInstantiationWilsonImplF.cc create mode 120000 Grid/qcd/action/fermion/instantiation/WilsonTwoIndexAntiSymmetricImplD/CompactWilsonCloverFermionInstantiationWilsonTwoIndexAntiSymmetricImplD.cc create mode 120000 Grid/qcd/action/fermion/instantiation/WilsonTwoIndexAntiSymmetricImplF/CompactWilsonCloverFermionInstantiationWilsonTwoIndexAntiSymmetricImplF.cc create mode 120000 Grid/qcd/action/fermion/instantiation/WilsonTwoIndexSymmetricImplD/CompactWilsonCloverFermionInstantiationWilsonTwoIndexSymmetricImplD.cc create mode 120000 Grid/qcd/action/fermion/instantiation/WilsonTwoIndexSymmetricImplF/CompactWilsonCloverFermionInstantiationWilsonTwoIndexSymmetricImplF.cc diff --git a/Grid/qcd/action/fermion/CompactWilsonCloverFermion.h b/Grid/qcd/action/fermion/CompactWilsonCloverFermion.h index 550bef85..3a166134 100644 --- a/Grid/qcd/action/fermion/CompactWilsonCloverFermion.h +++ b/Grid/qcd/action/fermion/CompactWilsonCloverFermion.h @@ -125,31 +125,7 @@ public: const RealD _csw_t = 0.0, const RealD _cF = 1.0, const WilsonAnisotropyCoefficients& clover_anisotropy = WilsonAnisotropyCoefficients(), - const ImplParams& impl_p = ImplParams()) - : WilsonBase(_Umu, Fgrid, Hgrid, _mass, impl_p, clover_anisotropy) - , csw_r(_csw_r) - , csw_t(_csw_t) - , cF(_cF) - , open_boundaries(impl_p.boundary_phases[Nd-1] == 0.0) - , Diagonal(&Fgrid), Triangle(&Fgrid) - , DiagonalEven(&Hgrid), TriangleEven(&Hgrid) - , DiagonalOdd(&Hgrid), TriangleOdd(&Hgrid) - , DiagonalInv(&Fgrid), TriangleInv(&Fgrid) - , DiagonalInvEven(&Hgrid), TriangleInvEven(&Hgrid) - , DiagonalInvOdd(&Hgrid), TriangleInvOdd(&Hgrid) - , Tmp(&Fgrid) - , BoundaryMask(&Fgrid) - , BoundaryMaskEven(&Hgrid), BoundaryMaskOdd(&Hgrid) - { - csw_r *= 0.5; - csw_t *= 0.5; - if (clover_anisotropy.isAnisotropic) - csw_r /= clover_anisotropy.xi_0; - - ImportGauge(_Umu); - if (open_boundaries) - CompactHelpers::SetupMasks(this->BoundaryMask, this->BoundaryMaskEven, this->BoundaryMaskOdd); - } + const ImplParams& impl_p = ImplParams()); ///////////////////////////////////////////// // Member functions (implementing interface) @@ -161,191 +137,41 @@ public: int ConstEE() override { return 0; }; int isTrivialEE() override { return 0; }; + void Dhop(const FermionField& in, FermionField& out, int dag) override; - void Dhop(const FermionField& in, FermionField& out, int dag) override { - WilsonBase::Dhop(in, out, dag); - if(open_boundaries) ApplyBoundaryMask(out); - } + void DhopOE(const FermionField& in, FermionField& out, int dag) override; - void DhopOE(const FermionField& in, FermionField& out, int dag) override { - WilsonBase::DhopOE(in, out, dag); - if(open_boundaries) ApplyBoundaryMask(out); - } + void DhopEO(const FermionField& in, FermionField& out, int dag) override; - void DhopEO(const FermionField& in, FermionField& out, int dag) override { - WilsonBase::DhopEO(in, out, dag); - if(open_boundaries) ApplyBoundaryMask(out); - } + void DhopDir(const FermionField& in, FermionField& out, int dir, int disp) override; - void DhopDir(const FermionField& in, FermionField& out, int dir, int disp) override { - WilsonBase::DhopDir(in, out, dir, disp); - if(this->open_boundaries) ApplyBoundaryMask(out); - } + void DhopDirAll(const FermionField& in, std::vector& out) /* override */; - void DhopDirAll(const FermionField& in, std::vector& out) /* override */ { - WilsonBase::DhopDirAll(in, out); - if(this->open_boundaries) { - for(auto& o : out) ApplyBoundaryMask(o); - } - } + void M(const FermionField& in, FermionField& out) override; - void M(const FermionField& in, FermionField& out) override { - out.Checkerboard() = in.Checkerboard(); - WilsonBase::Dhop(in, out, DaggerNo); // call base to save applying bc - Mooee(in, Tmp); - axpy(out, 1.0, out, Tmp); - if(open_boundaries) ApplyBoundaryMask(out); - } + void Mdag(const FermionField& in, FermionField& out) override; - void Mdag(const FermionField& in, FermionField& out) override { - out.Checkerboard() = in.Checkerboard(); - WilsonBase::Dhop(in, out, DaggerYes); // call base to save applying bc - MooeeDag(in, Tmp); - axpy(out, 1.0, out, Tmp); - if(open_boundaries) ApplyBoundaryMask(out); - } + void Meooe(const FermionField& in, FermionField& out) override; - void Meooe(const FermionField& in, FermionField& out) override { - WilsonBase::Meooe(in, out); - if(open_boundaries) ApplyBoundaryMask(out); - } + void MeooeDag(const FermionField& in, FermionField& out) override; - void MeooeDag(const FermionField& in, FermionField& out) override { - WilsonBase::MeooeDag(in, out); - if(open_boundaries) ApplyBoundaryMask(out); - } + void Mooee(const FermionField& in, FermionField& out) override; - void Mooee(const FermionField& in, FermionField& out) override { - if(in.Grid()->_isCheckerBoarded) { - if(in.Checkerboard() == Odd) { - MooeeInternal(in, out, DiagonalOdd, TriangleOdd); - } else { - MooeeInternal(in, out, DiagonalEven, TriangleEven); - } - } else { - MooeeInternal(in, out, Diagonal, Triangle); - } - if(open_boundaries) ApplyBoundaryMask(out); - } + void MooeeDag(const FermionField& in, FermionField& out) override; - void MooeeDag(const FermionField& in, FermionField& out) override { - Mooee(in, out); // blocks are hermitian - } + void MooeeInv(const FermionField& in, FermionField& out) override; - void MooeeInv(const FermionField& in, FermionField& out) override { - if(in.Grid()->_isCheckerBoarded) { - if(in.Checkerboard() == Odd) { - MooeeInternal(in, out, DiagonalInvOdd, TriangleInvOdd); - } else { - MooeeInternal(in, out, DiagonalInvEven, TriangleInvEven); - } - } else { - MooeeInternal(in, out, DiagonalInv, TriangleInv); - } - if(open_boundaries) ApplyBoundaryMask(out); - } + void MooeeInvDag(const FermionField& in, FermionField& out) override; - void MooeeInvDag(const FermionField& in, FermionField& out) override { - MooeeInv(in, out); // blocks are hermitian - } + void Mdir(const FermionField& in, FermionField& out, int dir, int disp) override; - void Mdir(const FermionField& in, FermionField& out, int dir, int disp) override { - DhopDir(in, out, dir, disp); - } + void MdirAll(const FermionField& in, std::vector& out) override; - void MdirAll(const FermionField& in, std::vector& out) override { - DhopDirAll(in, out); - } + void MDeriv(GaugeField& force, const FermionField& X, const FermionField& Y, int dag) override; - void MDeriv(GaugeField& force, const FermionField& X, const FermionField& Y, int dag) override { - assert(!open_boundaries); // TODO check for changes required for open bc + void MooDeriv(GaugeField& mat, const FermionField& U, const FermionField& V, int dag) override; - // NOTE: code copied from original clover term - conformable(X.Grid(), Y.Grid()); - conformable(X.Grid(), force.Grid()); - GaugeLinkField force_mu(force.Grid()), lambda(force.Grid()); - GaugeField clover_force(force.Grid()); - PropagatorField Lambda(force.Grid()); - - // Guido: Here we are hitting some performance issues: - // need to extract the components of the DoubledGaugeField - // for each call - // Possible solution - // Create a vector object to store them? (cons: wasting space) - std::vector U(Nd, this->Umu.Grid()); - - Impl::extractLinkField(U, this->Umu); - - force = Zero(); - // Derivative of the Wilson hopping term - this->DhopDeriv(force, X, Y, dag); - - /////////////////////////////////////////////////////////// - // Clover term derivative - /////////////////////////////////////////////////////////// - Impl::outerProductImpl(Lambda, X, Y); - //std::cout << "Lambda:" << Lambda << std::endl; - - Gamma::Algebra sigma[] = { - Gamma::Algebra::SigmaXY, - Gamma::Algebra::SigmaXZ, - Gamma::Algebra::SigmaXT, - Gamma::Algebra::MinusSigmaXY, - Gamma::Algebra::SigmaYZ, - Gamma::Algebra::SigmaYT, - Gamma::Algebra::MinusSigmaXZ, - Gamma::Algebra::MinusSigmaYZ, - Gamma::Algebra::SigmaZT, - Gamma::Algebra::MinusSigmaXT, - Gamma::Algebra::MinusSigmaYT, - Gamma::Algebra::MinusSigmaZT}; - - /* - sigma_{\mu \nu}= - | 0 sigma[0] sigma[1] sigma[2] | - | sigma[3] 0 sigma[4] sigma[5] | - | sigma[6] sigma[7] 0 sigma[8] | - | sigma[9] sigma[10] sigma[11] 0 | - */ - - int count = 0; - clover_force = Zero(); - for (int mu = 0; mu < 4; mu++) - { - force_mu = Zero(); - for (int nu = 0; nu < 4; nu++) - { - if (mu == nu) - continue; - - RealD factor; - if (nu == 4 || mu == 4) - { - factor = 2.0 * csw_t; - } - else - { - factor = 2.0 * csw_r; - } - PropagatorField Slambda = Gamma(sigma[count]) * Lambda; // sigma checked - Impl::TraceSpinImpl(lambda, Slambda); // traceSpin ok - force_mu -= factor*Helpers::Cmunu(U, lambda, mu, nu); // checked - count++; - } - - pokeLorentz(clover_force, U[mu] * force_mu, mu); - } - //clover_force *= csw; - force += clover_force; - } - - void MooDeriv(GaugeField& mat, const FermionField& U, const FermionField& V, int dag) override { - assert(0); - } - - void MeeDeriv(GaugeField& mat, const FermionField& U, const FermionField& V, int dag) override { - assert(0); - } + void MeeDeriv(GaugeField& mat, const FermionField& U, const FermionField& V, int dag) override; ///////////////////////////////////////////// // Member functions (internals) @@ -354,93 +180,13 @@ public: void MooeeInternal(const FermionField& in, FermionField& out, const CloverDiagonalField& diagonal, - const CloverTriangleField& triangle) { - assert(in.Checkerboard() == Odd || in.Checkerboard() == Even); - out.Checkerboard() = in.Checkerboard(); - conformable(in, out); - conformable(in, diagonal); - conformable(in, triangle); - - CompactHelpers::MooeeKernel(diagonal.oSites(), 1, in, out, diagonal, triangle); - } + const CloverTriangleField& triangle); ///////////////////////////////////////////// // Helpers ///////////////////////////////////////////// - void ImportGauge(const GaugeField& _Umu) override { - // NOTE: parts copied from original implementation - - // Import gauge into base class - double t0 = usecond(); - WilsonBase::ImportGauge(_Umu); // NOTE: called here and in wilson constructor -> performed twice, but can't avoid that - - // Initialize temporary variables - double t1 = usecond(); - conformable(_Umu.Grid(), this->GaugeGrid()); - GridBase* grid = _Umu.Grid(); - typename Impl::GaugeLinkField Bx(grid), By(grid), Bz(grid), Ex(grid), Ey(grid), Ez(grid); - CloverField TmpOriginal(grid); - - // Compute the field strength terms mu>nu - double t2 = usecond(); - WilsonLoops::FieldStrength(Bx, _Umu, Zdir, Ydir); - WilsonLoops::FieldStrength(By, _Umu, Zdir, Xdir); - WilsonLoops::FieldStrength(Bz, _Umu, Ydir, Xdir); - WilsonLoops::FieldStrength(Ex, _Umu, Tdir, Xdir); - WilsonLoops::FieldStrength(Ey, _Umu, Tdir, Ydir); - WilsonLoops::FieldStrength(Ez, _Umu, Tdir, Zdir); - - // Compute the Clover Operator acting on Colour and Spin - // multiply here by the clover coefficients for the anisotropy - double t3 = usecond(); - TmpOriginal = Helpers::fillCloverYZ(Bx) * csw_r; - TmpOriginal += Helpers::fillCloverXZ(By) * csw_r; - TmpOriginal += Helpers::fillCloverXY(Bz) * csw_r; - TmpOriginal += Helpers::fillCloverXT(Ex) * csw_t; - TmpOriginal += Helpers::fillCloverYT(Ey) * csw_t; - TmpOriginal += Helpers::fillCloverZT(Ez) * csw_t; - TmpOriginal += this->diag_mass; - - // Convert the data layout of the clover term - double t4 = usecond(); - CompactHelpers::ConvertLayout(TmpOriginal, Diagonal, Triangle); - - // Possible modify the boundary values - double t5 = usecond(); - if(open_boundaries) CompactHelpers::ModifyBoundaries(Diagonal, Triangle, csw_t, cF, this->diag_mass); - - // Invert the clover term in the improved layout - double t6 = usecond(); - CompactHelpers::Invert(Diagonal, Triangle, DiagonalInv, TriangleInv); - - // Fill the remaining clover fields - double t7 = usecond(); - pickCheckerboard(Even, DiagonalEven, Diagonal); - pickCheckerboard(Even, TriangleEven, Triangle); - pickCheckerboard(Odd, DiagonalOdd, Diagonal); - pickCheckerboard(Odd, TriangleOdd, Triangle); - pickCheckerboard(Even, DiagonalInvEven, DiagonalInv); - pickCheckerboard(Even, TriangleInvEven, TriangleInv); - pickCheckerboard(Odd, DiagonalInvOdd, DiagonalInv); - pickCheckerboard(Odd, TriangleInvOdd, TriangleInv); - - // Report timings - double t8 = usecond(); -#if 0 - std::cout << GridLogMessage << "CompactWilsonCloverFermion::ImportGauge timings:" - << " WilsonFermion::Importgauge = " << (t1 - t0) / 1e6 - << ", allocations = " << (t2 - t1) / 1e6 - << ", field strength = " << (t3 - t2) / 1e6 - << ", fill clover = " << (t4 - t3) / 1e6 - << ", convert = " << (t5 - t4) / 1e6 - << ", boundaries = " << (t6 - t5) / 1e6 - << ", inversions = " << (t7 - t6) / 1e6 - << ", pick cbs = " << (t8 - t7) / 1e6 - << ", total = " << (t8 - t0) / 1e6 - << std::endl; -#endif - } + void ImportGauge(const GaugeField& _Umu) override; ///////////////////////////////////////////// // Helpers diff --git a/Grid/qcd/action/fermion/Fermion.h b/Grid/qcd/action/fermion/Fermion.h index 59fc17d5..78cf7851 100644 --- a/Grid/qcd/action/fermion/Fermion.h +++ b/Grid/qcd/action/fermion/Fermion.h @@ -53,6 +53,7 @@ NAMESPACE_CHECK(Wilson); #include // 4d wilson like NAMESPACE_CHECK(WilsonTM); #include // 4d wilson clover fermions +#include // 4d compact wilson clover fermions NAMESPACE_CHECK(WilsonClover); #include // 5d base used by all 5d overlap types NAMESPACE_CHECK(Wilson5D); @@ -153,6 +154,23 @@ typedef WilsonCloverFermion WilsonCloverTwoInd typedef WilsonCloverFermion WilsonCloverTwoIndexAntiSymmetricFermionF; typedef WilsonCloverFermion WilsonCloverTwoIndexAntiSymmetricFermionD; +// Compact Clover fermions +typedef CompactWilsonCloverFermion CompactWilsonCloverFermionR; +typedef CompactWilsonCloverFermion CompactWilsonCloverFermionF; +typedef CompactWilsonCloverFermion CompactWilsonCloverFermionD; + +typedef CompactWilsonCloverFermion CompactWilsonCloverAdjFermionR; +typedef CompactWilsonCloverFermion CompactWilsonCloverAdjFermionF; +typedef CompactWilsonCloverFermion CompactWilsonCloverAdjFermionD; + +typedef CompactWilsonCloverFermion CompactWilsonCloverTwoIndexSymmetricFermionR; +typedef CompactWilsonCloverFermion CompactWilsonCloverTwoIndexSymmetricFermionF; +typedef CompactWilsonCloverFermion CompactWilsonCloverTwoIndexSymmetricFermionD; + +typedef CompactWilsonCloverFermion CompactWilsonCloverTwoIndexAntiSymmetricFermionR; +typedef CompactWilsonCloverFermion CompactWilsonCloverTwoIndexAntiSymmetricFermionF; +typedef CompactWilsonCloverFermion CompactWilsonCloverTwoIndexAntiSymmetricFermionD; + // Domain Wall fermions typedef DomainWallFermion DomainWallFermionR; typedef DomainWallFermion DomainWallFermionF; diff --git a/Grid/qcd/action/fermion/implementation/CompactWilsonCloverFermionImplementation.h b/Grid/qcd/action/fermion/implementation/CompactWilsonCloverFermionImplementation.h new file mode 100644 index 00000000..3dfcb133 --- /dev/null +++ b/Grid/qcd/action/fermion/implementation/CompactWilsonCloverFermionImplementation.h @@ -0,0 +1,363 @@ +/************************************************************************************* + + Grid physics library, www.github.com/paboyle/Grid + + Source file: ./lib/qcd/action/fermion/CompactWilsonCloverFermionImplementation.h + + Copyright (C) 2017 - 2022 + + Author: paboyle + Author: Guido Cossu + Author: Daniel Richtmann + + This program is free software; you can redistribute it and/or modify + it under the terms of the GNU General Public License as published by + the Free Software Foundation; either version 2 of the License, or + (at your option) any later version. + + This program is distributed in the hope that it will be useful, + but WITHOUT ANY WARRANTY; without even the implied warranty of + MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + GNU General Public License for more details. + + You should have received a copy of the GNU General Public License along + with this program; if not, write to the Free Software Foundation, Inc., + 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. + + See the full license in the file "LICENSE" in the top level distribution directory + *************************************************************************************/ +/* END LEGAL */ + +#include +#include +#include + +NAMESPACE_BEGIN(Grid); +template +CompactWilsonCloverFermion::CompactWilsonCloverFermion(GaugeField& _Umu, + GridCartesian& Fgrid, + GridRedBlackCartesian& Hgrid, + const RealD _mass, + const RealD _csw_r, + const RealD _csw_t, + const RealD _cF, + const WilsonAnisotropyCoefficients& clover_anisotropy, + const ImplParams& impl_p) + : WilsonBase(_Umu, Fgrid, Hgrid, _mass, impl_p, clover_anisotropy) + , csw_r(_csw_r) + , csw_t(_csw_t) + , cF(_cF) + , open_boundaries(impl_p.boundary_phases[Nd-1] == 0.0) + , Diagonal(&Fgrid), Triangle(&Fgrid) + , DiagonalEven(&Hgrid), TriangleEven(&Hgrid) + , DiagonalOdd(&Hgrid), TriangleOdd(&Hgrid) + , DiagonalInv(&Fgrid), TriangleInv(&Fgrid) + , DiagonalInvEven(&Hgrid), TriangleInvEven(&Hgrid) + , DiagonalInvOdd(&Hgrid), TriangleInvOdd(&Hgrid) + , Tmp(&Fgrid) + , BoundaryMask(&Fgrid) + , BoundaryMaskEven(&Hgrid), BoundaryMaskOdd(&Hgrid) +{ + csw_r *= 0.5; + csw_t *= 0.5; + if (clover_anisotropy.isAnisotropic) + csw_r /= clover_anisotropy.xi_0; + + ImportGauge(_Umu); + if (open_boundaries) + CompactHelpers::SetupMasks(this->BoundaryMask, this->BoundaryMaskEven, this->BoundaryMaskOdd); +} + +template +void CompactWilsonCloverFermion::Dhop(const FermionField& in, FermionField& out, int dag) { + WilsonBase::Dhop(in, out, dag); + if(open_boundaries) ApplyBoundaryMask(out); +} + +template +void CompactWilsonCloverFermion::DhopOE(const FermionField& in, FermionField& out, int dag) { + WilsonBase::DhopOE(in, out, dag); + if(open_boundaries) ApplyBoundaryMask(out); +} + +template +void CompactWilsonCloverFermion::DhopEO(const FermionField& in, FermionField& out, int dag) { + WilsonBase::DhopEO(in, out, dag); + if(open_boundaries) ApplyBoundaryMask(out); +} + +template +void CompactWilsonCloverFermion::DhopDir(const FermionField& in, FermionField& out, int dir, int disp) { + WilsonBase::DhopDir(in, out, dir, disp); + if(this->open_boundaries) ApplyBoundaryMask(out); +} + +template +void CompactWilsonCloverFermion::DhopDirAll(const FermionField& in, std::vector& out) { + WilsonBase::DhopDirAll(in, out); + if(this->open_boundaries) { + for(auto& o : out) ApplyBoundaryMask(o); + } +} + +template +void CompactWilsonCloverFermion::M(const FermionField& in, FermionField& out) { + out.Checkerboard() = in.Checkerboard(); + WilsonBase::Dhop(in, out, DaggerNo); // call base to save applying bc + Mooee(in, Tmp); + axpy(out, 1.0, out, Tmp); + if(open_boundaries) ApplyBoundaryMask(out); +} + +template +void CompactWilsonCloverFermion::Mdag(const FermionField& in, FermionField& out) { + out.Checkerboard() = in.Checkerboard(); + WilsonBase::Dhop(in, out, DaggerYes); // call base to save applying bc + MooeeDag(in, Tmp); + axpy(out, 1.0, out, Tmp); + if(open_boundaries) ApplyBoundaryMask(out); +} + +template +void CompactWilsonCloverFermion::Meooe(const FermionField& in, FermionField& out) { + WilsonBase::Meooe(in, out); + if(open_boundaries) ApplyBoundaryMask(out); +} + +template +void CompactWilsonCloverFermion::MeooeDag(const FermionField& in, FermionField& out) { + WilsonBase::MeooeDag(in, out); + if(open_boundaries) ApplyBoundaryMask(out); +} + +template +void CompactWilsonCloverFermion::Mooee(const FermionField& in, FermionField& out) { + if(in.Grid()->_isCheckerBoarded) { + if(in.Checkerboard() == Odd) { + MooeeInternal(in, out, DiagonalOdd, TriangleOdd); + } else { + MooeeInternal(in, out, DiagonalEven, TriangleEven); + } + } else { + MooeeInternal(in, out, Diagonal, Triangle); + } + if(open_boundaries) ApplyBoundaryMask(out); +} + +template +void CompactWilsonCloverFermion::MooeeDag(const FermionField& in, FermionField& out) { + Mooee(in, out); // blocks are hermitian +} + +template +void CompactWilsonCloverFermion::MooeeInv(const FermionField& in, FermionField& out) { + if(in.Grid()->_isCheckerBoarded) { + if(in.Checkerboard() == Odd) { + MooeeInternal(in, out, DiagonalInvOdd, TriangleInvOdd); + } else { + MooeeInternal(in, out, DiagonalInvEven, TriangleInvEven); + } + } else { + MooeeInternal(in, out, DiagonalInv, TriangleInv); + } + if(open_boundaries) ApplyBoundaryMask(out); +} + +template +void CompactWilsonCloverFermion::MooeeInvDag(const FermionField& in, FermionField& out) { + MooeeInv(in, out); // blocks are hermitian +} + +template +void CompactWilsonCloverFermion::Mdir(const FermionField& in, FermionField& out, int dir, int disp) { + DhopDir(in, out, dir, disp); +} + +template +void CompactWilsonCloverFermion::MdirAll(const FermionField& in, std::vector& out) { + DhopDirAll(in, out); +} + +template +void CompactWilsonCloverFermion::MDeriv(GaugeField& force, const FermionField& X, const FermionField& Y, int dag) { + assert(!open_boundaries); // TODO check for changes required for open bc + + // NOTE: code copied from original clover term + conformable(X.Grid(), Y.Grid()); + conformable(X.Grid(), force.Grid()); + GaugeLinkField force_mu(force.Grid()), lambda(force.Grid()); + GaugeField clover_force(force.Grid()); + PropagatorField Lambda(force.Grid()); + + // Guido: Here we are hitting some performance issues: + // need to extract the components of the DoubledGaugeField + // for each call + // Possible solution + // Create a vector object to store them? (cons: wasting space) + std::vector U(Nd, this->Umu.Grid()); + + Impl::extractLinkField(U, this->Umu); + + force = Zero(); + // Derivative of the Wilson hopping term + this->DhopDeriv(force, X, Y, dag); + + /////////////////////////////////////////////////////////// + // Clover term derivative + /////////////////////////////////////////////////////////// + Impl::outerProductImpl(Lambda, X, Y); + //std::cout << "Lambda:" << Lambda << std::endl; + + Gamma::Algebra sigma[] = { + Gamma::Algebra::SigmaXY, + Gamma::Algebra::SigmaXZ, + Gamma::Algebra::SigmaXT, + Gamma::Algebra::MinusSigmaXY, + Gamma::Algebra::SigmaYZ, + Gamma::Algebra::SigmaYT, + Gamma::Algebra::MinusSigmaXZ, + Gamma::Algebra::MinusSigmaYZ, + Gamma::Algebra::SigmaZT, + Gamma::Algebra::MinusSigmaXT, + Gamma::Algebra::MinusSigmaYT, + Gamma::Algebra::MinusSigmaZT}; + + /* + sigma_{\mu \nu}= + | 0 sigma[0] sigma[1] sigma[2] | + | sigma[3] 0 sigma[4] sigma[5] | + | sigma[6] sigma[7] 0 sigma[8] | + | sigma[9] sigma[10] sigma[11] 0 | + */ + + int count = 0; + clover_force = Zero(); + for (int mu = 0; mu < 4; mu++) + { + force_mu = Zero(); + for (int nu = 0; nu < 4; nu++) + { + if (mu == nu) + continue; + + RealD factor; + if (nu == 4 || mu == 4) + { + factor = 2.0 * csw_t; + } + else + { + factor = 2.0 * csw_r; + } + PropagatorField Slambda = Gamma(sigma[count]) * Lambda; // sigma checked + Impl::TraceSpinImpl(lambda, Slambda); // traceSpin ok + force_mu -= factor*Helpers::Cmunu(U, lambda, mu, nu); // checked + count++; + } + + pokeLorentz(clover_force, U[mu] * force_mu, mu); + } + //clover_force *= csw; + force += clover_force; +} + +template +void CompactWilsonCloverFermion::MooDeriv(GaugeField& mat, const FermionField& U, const FermionField& V, int dag) { + assert(0); +} + +template +void CompactWilsonCloverFermion::MeeDeriv(GaugeField& mat, const FermionField& U, const FermionField& V, int dag) { + assert(0); +} + +template +void CompactWilsonCloverFermion::MooeeInternal(const FermionField& in, + FermionField& out, + const CloverDiagonalField& diagonal, + const CloverTriangleField& triangle) { + assert(in.Checkerboard() == Odd || in.Checkerboard() == Even); + out.Checkerboard() = in.Checkerboard(); + conformable(in, out); + conformable(in, diagonal); + conformable(in, triangle); + + CompactHelpers::MooeeKernel(diagonal.oSites(), 1, in, out, diagonal, triangle); +} + +template +void CompactWilsonCloverFermion::ImportGauge(const GaugeField& _Umu) { + // NOTE: parts copied from original implementation + + // Import gauge into base class + double t0 = usecond(); + WilsonBase::ImportGauge(_Umu); // NOTE: called here and in wilson constructor -> performed twice, but can't avoid that + + // Initialize temporary variables + double t1 = usecond(); + conformable(_Umu.Grid(), this->GaugeGrid()); + GridBase* grid = _Umu.Grid(); + typename Impl::GaugeLinkField Bx(grid), By(grid), Bz(grid), Ex(grid), Ey(grid), Ez(grid); + CloverField TmpOriginal(grid); + + // Compute the field strength terms mu>nu + double t2 = usecond(); + WilsonLoops::FieldStrength(Bx, _Umu, Zdir, Ydir); + WilsonLoops::FieldStrength(By, _Umu, Zdir, Xdir); + WilsonLoops::FieldStrength(Bz, _Umu, Ydir, Xdir); + WilsonLoops::FieldStrength(Ex, _Umu, Tdir, Xdir); + WilsonLoops::FieldStrength(Ey, _Umu, Tdir, Ydir); + WilsonLoops::FieldStrength(Ez, _Umu, Tdir, Zdir); + + // Compute the Clover Operator acting on Colour and Spin + // multiply here by the clover coefficients for the anisotropy + double t3 = usecond(); + TmpOriginal = Helpers::fillCloverYZ(Bx) * csw_r; + TmpOriginal += Helpers::fillCloverXZ(By) * csw_r; + TmpOriginal += Helpers::fillCloverXY(Bz) * csw_r; + TmpOriginal += Helpers::fillCloverXT(Ex) * csw_t; + TmpOriginal += Helpers::fillCloverYT(Ey) * csw_t; + TmpOriginal += Helpers::fillCloverZT(Ez) * csw_t; + TmpOriginal += this->diag_mass; + + // Convert the data layout of the clover term + double t4 = usecond(); + CompactHelpers::ConvertLayout(TmpOriginal, Diagonal, Triangle); + + // Possible modify the boundary values + double t5 = usecond(); + if(open_boundaries) CompactHelpers::ModifyBoundaries(Diagonal, Triangle, csw_t, cF, this->diag_mass); + + // Invert the clover term in the improved layout + double t6 = usecond(); + CompactHelpers::Invert(Diagonal, Triangle, DiagonalInv, TriangleInv); + + // Fill the remaining clover fields + double t7 = usecond(); + pickCheckerboard(Even, DiagonalEven, Diagonal); + pickCheckerboard(Even, TriangleEven, Triangle); + pickCheckerboard(Odd, DiagonalOdd, Diagonal); + pickCheckerboard(Odd, TriangleOdd, Triangle); + pickCheckerboard(Even, DiagonalInvEven, DiagonalInv); + pickCheckerboard(Even, TriangleInvEven, TriangleInv); + pickCheckerboard(Odd, DiagonalInvOdd, DiagonalInv); + pickCheckerboard(Odd, TriangleInvOdd, TriangleInv); + + // Report timings + double t8 = usecond(); +#if 0 + std::cout << GridLogMessage << "CompactWilsonCloverFermion::ImportGauge timings:" + << " WilsonFermion::Importgauge = " << (t1 - t0) / 1e6 + << ", allocations = " << (t2 - t1) / 1e6 + << ", field strength = " << (t3 - t2) / 1e6 + << ", fill clover = " << (t4 - t3) / 1e6 + << ", convert = " << (t5 - t4) / 1e6 + << ", boundaries = " << (t6 - t5) / 1e6 + << ", inversions = " << (t7 - t6) / 1e6 + << ", pick cbs = " << (t8 - t7) / 1e6 + << ", total = " << (t8 - t0) / 1e6 + << std::endl; +#endif +} + +NAMESPACE_END(Grid); diff --git a/Grid/qcd/action/fermion/instantiation/CompactWilsonCloverFermionInstantiation.cc.master b/Grid/qcd/action/fermion/instantiation/CompactWilsonCloverFermionInstantiation.cc.master new file mode 100644 index 00000000..7c91c252 --- /dev/null +++ b/Grid/qcd/action/fermion/instantiation/CompactWilsonCloverFermionInstantiation.cc.master @@ -0,0 +1,41 @@ +/************************************************************************************* + + Grid physics library, www.github.com/paboyle/Grid + + Source file: ./lib/ qcd/action/fermion/instantiation/CompactWilsonCloverFermionInstantiation.cc.master + + Copyright (C) 2017 - 2022 + + Author: paboyle + Author: Guido Cossu + Author: Daniel Richtmann + + This program is free software; you can redistribute it and/or modify + it under the terms of the GNU General Public License as published by + the Free Software Foundation; either version 2 of the License, or + (at your option) any later version. + + This program is distributed in the hope that it will be useful, + but WITHOUT ANY WARRANTY; without even the implied warranty of + MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + GNU General Public License for more details. + + You should have received a copy of the GNU General Public License along + with this program; if not, write to the Free Software Foundation, Inc., + 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. + + See the full license in the file "LICENSE" in the top level distribution directory + *************************************************************************************/ +/* END LEGAL */ + +#include +#include +#include +#include + +NAMESPACE_BEGIN(Grid); + +#include "impl.h" +template class CompactWilsonCloverFermion; + +NAMESPACE_END(Grid); diff --git a/Grid/qcd/action/fermion/instantiation/GparityWilsonImplD/CompactWilsonCloverFermionInstantiationGparityWilsonImplD.cc b/Grid/qcd/action/fermion/instantiation/GparityWilsonImplD/CompactWilsonCloverFermionInstantiationGparityWilsonImplD.cc new file mode 120000 index 00000000..a739bb99 --- /dev/null +++ b/Grid/qcd/action/fermion/instantiation/GparityWilsonImplD/CompactWilsonCloverFermionInstantiationGparityWilsonImplD.cc @@ -0,0 +1 @@ +../CompactWilsonCloverFermionInstantiation.cc.master \ No newline at end of file diff --git a/Grid/qcd/action/fermion/instantiation/GparityWilsonImplF/CompactWilsonCloverFermionInstantiationGparityWilsonImplF.cc b/Grid/qcd/action/fermion/instantiation/GparityWilsonImplF/CompactWilsonCloverFermionInstantiationGparityWilsonImplF.cc new file mode 120000 index 00000000..a739bb99 --- /dev/null +++ b/Grid/qcd/action/fermion/instantiation/GparityWilsonImplF/CompactWilsonCloverFermionInstantiationGparityWilsonImplF.cc @@ -0,0 +1 @@ +../CompactWilsonCloverFermionInstantiation.cc.master \ No newline at end of file diff --git a/Grid/qcd/action/fermion/instantiation/WilsonAdjImplD/CompactWilsonCloverFermionInstantiationWilsonAdjImplD.cc b/Grid/qcd/action/fermion/instantiation/WilsonAdjImplD/CompactWilsonCloverFermionInstantiationWilsonAdjImplD.cc new file mode 120000 index 00000000..a739bb99 --- /dev/null +++ b/Grid/qcd/action/fermion/instantiation/WilsonAdjImplD/CompactWilsonCloverFermionInstantiationWilsonAdjImplD.cc @@ -0,0 +1 @@ +../CompactWilsonCloverFermionInstantiation.cc.master \ No newline at end of file diff --git a/Grid/qcd/action/fermion/instantiation/WilsonAdjImplF/CompactWilsonCloverFermionInstantiationWilsonAdjImplF.cc b/Grid/qcd/action/fermion/instantiation/WilsonAdjImplF/CompactWilsonCloverFermionInstantiationWilsonAdjImplF.cc new file mode 120000 index 00000000..a739bb99 --- /dev/null +++ b/Grid/qcd/action/fermion/instantiation/WilsonAdjImplF/CompactWilsonCloverFermionInstantiationWilsonAdjImplF.cc @@ -0,0 +1 @@ +../CompactWilsonCloverFermionInstantiation.cc.master \ No newline at end of file diff --git a/Grid/qcd/action/fermion/instantiation/WilsonImplD/CompactWilsonCloverFermionInstantiationWilsonImplD.cc b/Grid/qcd/action/fermion/instantiation/WilsonImplD/CompactWilsonCloverFermionInstantiationWilsonImplD.cc new file mode 120000 index 00000000..a739bb99 --- /dev/null +++ b/Grid/qcd/action/fermion/instantiation/WilsonImplD/CompactWilsonCloverFermionInstantiationWilsonImplD.cc @@ -0,0 +1 @@ +../CompactWilsonCloverFermionInstantiation.cc.master \ No newline at end of file diff --git a/Grid/qcd/action/fermion/instantiation/WilsonImplF/CompactWilsonCloverFermionInstantiationWilsonImplF.cc b/Grid/qcd/action/fermion/instantiation/WilsonImplF/CompactWilsonCloverFermionInstantiationWilsonImplF.cc new file mode 120000 index 00000000..a739bb99 --- /dev/null +++ b/Grid/qcd/action/fermion/instantiation/WilsonImplF/CompactWilsonCloverFermionInstantiationWilsonImplF.cc @@ -0,0 +1 @@ +../CompactWilsonCloverFermionInstantiation.cc.master \ No newline at end of file diff --git a/Grid/qcd/action/fermion/instantiation/WilsonTwoIndexAntiSymmetricImplD/CompactWilsonCloverFermionInstantiationWilsonTwoIndexAntiSymmetricImplD.cc b/Grid/qcd/action/fermion/instantiation/WilsonTwoIndexAntiSymmetricImplD/CompactWilsonCloverFermionInstantiationWilsonTwoIndexAntiSymmetricImplD.cc new file mode 120000 index 00000000..a739bb99 --- /dev/null +++ b/Grid/qcd/action/fermion/instantiation/WilsonTwoIndexAntiSymmetricImplD/CompactWilsonCloverFermionInstantiationWilsonTwoIndexAntiSymmetricImplD.cc @@ -0,0 +1 @@ +../CompactWilsonCloverFermionInstantiation.cc.master \ No newline at end of file diff --git a/Grid/qcd/action/fermion/instantiation/WilsonTwoIndexAntiSymmetricImplF/CompactWilsonCloverFermionInstantiationWilsonTwoIndexAntiSymmetricImplF.cc b/Grid/qcd/action/fermion/instantiation/WilsonTwoIndexAntiSymmetricImplF/CompactWilsonCloverFermionInstantiationWilsonTwoIndexAntiSymmetricImplF.cc new file mode 120000 index 00000000..a739bb99 --- /dev/null +++ b/Grid/qcd/action/fermion/instantiation/WilsonTwoIndexAntiSymmetricImplF/CompactWilsonCloverFermionInstantiationWilsonTwoIndexAntiSymmetricImplF.cc @@ -0,0 +1 @@ +../CompactWilsonCloverFermionInstantiation.cc.master \ No newline at end of file diff --git a/Grid/qcd/action/fermion/instantiation/WilsonTwoIndexSymmetricImplD/CompactWilsonCloverFermionInstantiationWilsonTwoIndexSymmetricImplD.cc b/Grid/qcd/action/fermion/instantiation/WilsonTwoIndexSymmetricImplD/CompactWilsonCloverFermionInstantiationWilsonTwoIndexSymmetricImplD.cc new file mode 120000 index 00000000..a739bb99 --- /dev/null +++ b/Grid/qcd/action/fermion/instantiation/WilsonTwoIndexSymmetricImplD/CompactWilsonCloverFermionInstantiationWilsonTwoIndexSymmetricImplD.cc @@ -0,0 +1 @@ +../CompactWilsonCloverFermionInstantiation.cc.master \ No newline at end of file diff --git a/Grid/qcd/action/fermion/instantiation/WilsonTwoIndexSymmetricImplF/CompactWilsonCloverFermionInstantiationWilsonTwoIndexSymmetricImplF.cc b/Grid/qcd/action/fermion/instantiation/WilsonTwoIndexSymmetricImplF/CompactWilsonCloverFermionInstantiationWilsonTwoIndexSymmetricImplF.cc new file mode 120000 index 00000000..a739bb99 --- /dev/null +++ b/Grid/qcd/action/fermion/instantiation/WilsonTwoIndexSymmetricImplF/CompactWilsonCloverFermionInstantiationWilsonTwoIndexSymmetricImplF.cc @@ -0,0 +1 @@ +../CompactWilsonCloverFermionInstantiation.cc.master \ No newline at end of file diff --git a/Grid/qcd/action/fermion/instantiation/generate_instantiations.sh b/Grid/qcd/action/fermion/instantiation/generate_instantiations.sh index d7553cdb..a09fd420 100755 --- a/Grid/qcd/action/fermion/instantiation/generate_instantiations.sh +++ b/Grid/qcd/action/fermion/instantiation/generate_instantiations.sh @@ -40,7 +40,7 @@ EOF done -CC_LIST="WilsonCloverFermionInstantiation WilsonFermionInstantiation WilsonKernelsInstantiation WilsonTMFermionInstantiation" +CC_LIST="WilsonCloverFermionInstantiation CompactWilsonCloverFermionInstantiation WilsonFermionInstantiation WilsonKernelsInstantiation WilsonTMFermionInstantiation" for impl in $WILSON_IMPL_LIST do