/************************************************************************************* Grid physics library, www.github.com/paboyle/Grid Source file: ./lib/qcd/action/fermion/WilsonKernelsAsmAvx512.h Copyright (C) 2015 Author: Peter Boyle Author: paboyle This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 2 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program; if not, write to the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. See the full license in the file "LICENSE" in the top level distribution directory *************************************************************************************/ /* END LEGAL */ #if defined(AVX512) /////////////////////////////////////////////////////////// // If we are AVX512 specialise the single precision routine /////////////////////////////////////////////////////////// #include #include static Vector signsF; template int setupSigns(Vector& signs ){ Vector bother(2); signs = bother; vrsign(signs[0]); visign(signs[1]); return 1; } static int signInitF = setupSigns(signsF); #define MAYBEPERM(A,perm) if (perm) { A ; } #define MULT_2SPIN(ptr,pf) MULT_ADDSUB_2SPIN(ptr,pf) #define COMPLEX_SIGNS(isigns) vComplexF *isigns = &signsF[0]; ///////////////////////////////////////////////////////////////// // XYZT vectorised, undag Kernel, single ///////////////////////////////////////////////////////////////// #undef KERNEL_DAG template<> void WilsonKernels::DiracOptAsmDhopSite(StencilImpl &st,LebesgueOrder & lo,DoubledGaugeField &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionField &in, FermionField &out) #include ///////////////////////////////////////////////////////////////// // XYZT vectorised, dag Kernel, single ///////////////////////////////////////////////////////////////// #define KERNEL_DAG template<> void WilsonKernels::DiracOptAsmDhopSiteDag(StencilImpl &st,LebesgueOrder & lo,DoubledGaugeField &U,SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionField &in, FermionField &out) #include #undef MAYBEPERM #undef MULT_2SPIN #define MAYBEPERM(A,B) #define MULT_2SPIN(ptr,pf) MULT_ADDSUB_2SPIN_LS(ptr,pf) ///////////////////////////////////////////////////////////////// // Ls vectorised, undag Kernel, single ///////////////////////////////////////////////////////////////// #undef KERNEL_DAG template<> void WilsonKernels::DiracOptAsmDhopSite(StencilImpl &st,LebesgueOrder & lo,DoubledGaugeField &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionField &in, FermionField &out) #include ///////////////////////////////////////////////////////////////// // Ls vectorised, dag Kernel, single ///////////////////////////////////////////////////////////////// #define KERNEL_DAG template<> void WilsonKernels::DiracOptAsmDhopSiteDag(StencilImpl &st,LebesgueOrder & lo,DoubledGaugeField &U,SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionField &in, FermionField &out) #include #undef COMPLEX_SIGNS #undef MAYBEPERM #undef MULT_2SPIN /////////////////////////////////////////////////////////// // If we are AVX512 specialise the double precision routine /////////////////////////////////////////////////////////// #include static Vector signsD; static int signInitD = setupSigns(signsD); #define MAYBEPERM(A,perm) if (perm) { A ; } #define MULT_2SPIN(ptr,pf) MULT_ADDSUB_2SPIN(ptr,pf) #define COMPLEX_SIGNS(isigns) vComplexD *isigns = &signsD[0]; ///////////////////////////////////////////////////////////////// // XYZT Vectorised, undag Kernel, double ///////////////////////////////////////////////////////////////// #undef KERNEL_DAG template<> void WilsonKernels::DiracOptAsmDhopSite(StencilImpl &st,LebesgueOrder & lo,DoubledGaugeField &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionField &in, FermionField &out) #include ///////////////////////////////////////////////////////////////// ///////////////////////////////////////////////////////////////// // XYZT Vectorised, dag Kernel, double ///////////////////////////////////////////////////////////////// #define KERNEL_DAG template<> void WilsonKernels::DiracOptAsmDhopSiteDag(StencilImpl &st,LebesgueOrder & lo,DoubledGaugeField &U,SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionField &in, FermionField &out) #include ///////////////////////////////////////////////////////////////// #undef MAYBEPERM #undef MULT_2SPIN #define MAYBEPERM(A,B) #define MULT_2SPIN(ptr,pf) MULT_ADDSUB_2SPIN_LS(ptr,pf) ///////////////////////////////////////////////////////////////// // Ls vectorised, undag Kernel, double ///////////////////////////////////////////////////////////////// #undef KERNEL_DAG template<> void WilsonKernels::DiracOptAsmDhopSite(StencilImpl &st,LebesgueOrder & lo,DoubledGaugeField &U, SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionField &in, FermionField &out) #include ///////////////////////////////////////////////////////////////// ///////////////////////////////////////////////////////////////// // Ls vectorised, dag Kernel, double ///////////////////////////////////////////////////////////////// #define KERNEL_DAG template<> void WilsonKernels::DiracOptAsmDhopSiteDag(StencilImpl &st,LebesgueOrder & lo,DoubledGaugeField &U,SiteHalfSpinor *buf, int ss,int ssU,int Ls,int Ns,const FermionField &in, FermionField &out) #include ///////////////////////////////////////////////////////////////// #undef COMPLEX_SIGNS #undef MAYBEPERM #undef MULT_2SPIN #endif //AVX512