/************************************************************************************* Grid physics library, www.github.com/paboyle/Grid Source file: ./lib/qcd/action/fermion/WilsonCompressor.h Copyright (C) 2015 Author: Peter Boyle Author: Peter Boyle Author: paboyle This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 2 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program; if not, write to the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. See the full license in the file "LICENSE" in the top level distribution directory *************************************************************************************/ /* END LEGAL */ #ifndef GRID_QCD_WILSON_COMPRESSOR_H #define GRID_QCD_WILSON_COMPRESSOR_H namespace Grid { namespace QCD { /* WilsonCompressor: functor that turns a SiteSpinor into a SiteHalfSpinor by calling one of spProjXp..spProjTm. The constructor stores dag and asserts it is 0 or 1; Point(p) stores the direction index in mu. operator() uses mu unchanged when dag is non-zero and (mu+Nd)%(2*Nd) when dag is zero, then switches on that value and asserts on anything other than the eight direction cases. NOTE(review): the parameter list after 'template' is missing in this copy; the body uses the names SiteHalfSpinor and SiteSpinor, so those are presumably the template parameters - confirm against upstream. */ template class WilsonCompressor { public: int mu; int dag; WilsonCompressor(int _dag){ mu=0; dag=_dag; assert((dag==0)||(dag==1)); } void Point(int p) { mu=p; }; inline SiteHalfSpinor operator () (const SiteSpinor &in) { SiteHalfSpinor ret; int mudag=mu; if (!dag) { mudag=(mu+Nd)%(2*Nd); } switch(mudag) { case Xp: spProjXp(ret,in); break; case Yp: spProjYp(ret,in); break; case Zp: spProjZp(ret,in); break; case Tp: spProjTp(ret,in); break; case Xm: spProjXm(ret,in); break; case Ym: spProjYm(ret,in); break; case Zm: spProjZm(ret,in); break; case Tm: spProjTm(ret,in); break; default: assert(0); break; } return ret; } }; ///////////////////////// // optimised versions ///////////////////////// template class WilsonXpCompressor { public: inline 
SiteHalfSpinor operator () (const SiteSpinor &in) { SiteHalfSpinor ret; spProjXp(ret,in); return ret; } }; /* Each of the eight per-direction compressor classes (Xp, Yp, Zp, Tp, Xm, Ym, Zm, Tm) has no data members; its operator() calls exactly the one spProj routine named in its body and returns the result by value. */ template class WilsonYpCompressor { public: inline SiteHalfSpinor operator () (const SiteSpinor &in) { SiteHalfSpinor ret; spProjYp(ret,in); return ret; } }; template class WilsonZpCompressor { public: inline SiteHalfSpinor operator () (const SiteSpinor &in) { SiteHalfSpinor ret; spProjZp(ret,in); return ret; } }; template class WilsonTpCompressor { public: inline SiteHalfSpinor operator () (const SiteSpinor &in) { SiteHalfSpinor ret; spProjTp(ret,in); return ret; } }; template class WilsonXmCompressor { public: inline SiteHalfSpinor operator () (const SiteSpinor &in) { SiteHalfSpinor ret; spProjXm(ret,in); return ret; } }; template class WilsonYmCompressor { public: inline SiteHalfSpinor operator () (const SiteSpinor &in) { SiteHalfSpinor ret; spProjYm(ret,in); return ret; } }; template class WilsonZmCompressor { public: inline SiteHalfSpinor operator () (const SiteSpinor &in) { SiteHalfSpinor ret; spProjZm(ret,in); return ret; } }; template class WilsonTmCompressor { public: inline SiteHalfSpinor operator () (const SiteSpinor &in) { SiteHalfSpinor ret; spProjTm(ret,in); return ret; } }; // Fast comms buffer manipulation which should inline right through (avoid direction // dependent logic that prevents inlining /* WilsonStencil: derives from CartesianStencil and forwards all constructor arguments to it unchanged. HaloExchangeOptBegin empties Mergers and Packets, runs HaloGatherOpt, and returns a std::thread that runs Communicate(); the lambda captures by reference and uses this, so the stencil has to stay alive until that thread is joined. HaloExchangeOpt is the blocking form: it calls HaloExchangeOptBegin and then HaloExchangeOptComplete on the returned thread. NOTE(review): the template parameter lists and the template arguments of CartesianStencil, std::vector and Lattice are missing in this copy - restore them from upstream. */ template class WilsonStencil : public CartesianStencil { public: WilsonStencil(GridBase *grid, int npoints, int checkerboard, const std::vector &directions, const std::vector &distances) : CartesianStencil (grid,npoints,checkerboard,directions,distances) { }; template < class compressor> std::thread HaloExchangeOptBegin(const Lattice &source,compressor &compress) { this->Mergers.resize(0); this->Packets.resize(0); this->HaloGatherOpt(source,compress); return std::thread([&] { this->Communicate(); }); } template < class compressor> void HaloExchangeOpt(const Lattice &source,compressor &compress) { auto thr = this->HaloExchangeOptBegin(source,compress); 
this->HaloExchangeOptComplete(thr); } /* HaloExchangeOptComplete: calls CommsMerge() first, then joins thr; jointime accumulates the usecond() difference measured around the join only. */ void HaloExchangeOptComplete(std::thread &thr) { this->CommsMerge(); // spins this->jointime-=usecond(); thr.join(); this->jointime+=usecond(); } /* HaloGatherOpt: asserts that source._grid is this stencil's _grid and that comm_buf.size() equals _unified_buffer_size, resets u_comm_offset to 0, reads dag from the supplied compressor, then calls HaloGatherDir once for each of the eight fixed-direction compressors using dirs[0] through dirs[7]. Afterwards it asserts that u_comm_offset equals _unified_buffer_size. halogtime accumulates the usecond() difference over the whole call. NOTE(review): dirs is a function-local static vector, so one instance is shared by every call of a given instantiation - verify there are no concurrent callers. NOTE(review): the text between 'for(int mu=0;mu' and 'XpCompress;' is missing in this copy, so how dirs is filled from dag cannot be seen here - restore it from upstream before relying on this function. */ template < class compressor> void HaloGatherOpt(const Lattice &source,compressor &compress) { // conformable(source._grid,_grid); assert(source._grid==this->_grid); this->halogtime-=usecond(); assert (this->comm_buf.size() == this->_unified_buffer_size ); this->u_comm_offset=0; int dag = compress.dag; static std::vector dirs(Nd*2); for(int mu=0;mu XpCompress; this->HaloGatherDir(source,XpCompress,dirs[0]); WilsonYpCompressor YpCompress; this->HaloGatherDir(source,YpCompress,dirs[1]); WilsonZpCompressor ZpCompress; this->HaloGatherDir(source,ZpCompress,dirs[2]); WilsonTpCompressor TpCompress; this->HaloGatherDir(source,TpCompress,dirs[3]); WilsonXmCompressor XmCompress; this->HaloGatherDir(source,XmCompress,dirs[4]); WilsonYmCompressor YmCompress; this->HaloGatherDir(source,YmCompress,dirs[5]); WilsonZmCompressor ZmCompress; this->HaloGatherDir(source,ZmCompress,dirs[6]); WilsonTmCompressor TmCompress; this->HaloGatherDir(source,TmCompress,dirs[7]); assert(this->u_comm_offset==this->_unified_buffer_size); this->halogtime+=usecond(); } }; }} // namespace close #endif