1
0
mirror of https://github.com/paboyle/Grid.git synced 2025-04-04 11:15:55 +01:00

Small tweak so that benchmarks can suppress gauge-field bandwidth as a test: the gauge field (Umu) is now indexed through a separate site index, ssu.

This is a short-term hack while I benchmark.
This commit is contained in:
Peter Boyle 2015-05-10 15:25:23 +01:00
parent 2ffd941d67
commit 02ae26d091

View File

@ -106,6 +106,7 @@ void WilsonMatrix::Dhop(const LatticeFermion &in, LatticeFermion &out)
for(int sss=0;sss<grid->oSites();sss++){ for(int sss=0;sss<grid->oSites();sss++){
int ss = sss; int ss = sss;
int ssu= sss;
//int ss = Stencil._LebesgueReorder[sss]; //int ss = Stencil._LebesgueReorder[sss];
// Xp // Xp
@ -123,7 +124,7 @@ void WilsonMatrix::Dhop(const LatticeFermion &in, LatticeFermion &out)
} else { } else {
chi=comm_buf[offset]; chi=comm_buf[offset];
} }
mult(&Uchi(),&Umu._odata[ss](Xp),&chi()); mult(&Uchi(),&Umu._odata[ssu](Xp),&chi());
spReconXp(result,Uchi); spReconXp(result,Uchi);
// Yp // Yp
@ -141,7 +142,7 @@ void WilsonMatrix::Dhop(const LatticeFermion &in, LatticeFermion &out)
} else { } else {
chi=comm_buf[offset]; chi=comm_buf[offset];
} }
mult(&Uchi(),&Umu._odata[ss](Yp),&chi()); mult(&Uchi(),&Umu._odata[ssu](Yp),&chi());
accumReconYp(result,Uchi); accumReconYp(result,Uchi);
// Zp // Zp
@ -159,7 +160,7 @@ void WilsonMatrix::Dhop(const LatticeFermion &in, LatticeFermion &out)
} else { } else {
chi=comm_buf[offset]; chi=comm_buf[offset];
} }
mult(&Uchi(),&Umu._odata[ss](Zp),&chi()); mult(&Uchi(),&Umu._odata[ssu](Zp),&chi());
accumReconZp(result,Uchi); accumReconZp(result,Uchi);
// Tp // Tp
@ -177,7 +178,7 @@ void WilsonMatrix::Dhop(const LatticeFermion &in, LatticeFermion &out)
} else { } else {
chi=comm_buf[offset]; chi=comm_buf[offset];
} }
mult(&Uchi(),&Umu._odata[ss](Tp),&chi()); mult(&Uchi(),&Umu._odata[ssu](Tp),&chi());
accumReconTp(result,Uchi); accumReconTp(result,Uchi);
// Xm // Xm
@ -195,7 +196,7 @@ void WilsonMatrix::Dhop(const LatticeFermion &in, LatticeFermion &out)
} else { } else {
chi=comm_buf[offset]; chi=comm_buf[offset];
} }
mult(&Uchi(),&Umu._odata[ss](Xm),&chi()); mult(&Uchi(),&Umu._odata[ssu](Xm),&chi());
accumReconXm(result,Uchi); accumReconXm(result,Uchi);
@ -214,7 +215,7 @@ void WilsonMatrix::Dhop(const LatticeFermion &in, LatticeFermion &out)
} else { } else {
chi=comm_buf[offset]; chi=comm_buf[offset];
} }
mult(&Uchi(),&Umu._odata[ss](Ym),&chi()); mult(&Uchi(),&Umu._odata[ssu](Ym),&chi());
accumReconYm(result,Uchi); accumReconYm(result,Uchi);
// Zm // Zm
@ -232,7 +233,7 @@ void WilsonMatrix::Dhop(const LatticeFermion &in, LatticeFermion &out)
} else { } else {
chi=comm_buf[offset]; chi=comm_buf[offset];
} }
mult(&Uchi(),&Umu._odata[ss](Zm),&chi()); mult(&Uchi(),&Umu._odata[ssu](Zm),&chi());
accumReconZm(result,Uchi); accumReconZm(result,Uchi);
// Tm // Tm
@ -250,7 +251,7 @@ void WilsonMatrix::Dhop(const LatticeFermion &in, LatticeFermion &out)
} else { } else {
chi=comm_buf[offset]; chi=comm_buf[offset];
} }
mult(&Uchi(),&Umu._odata[ss](Tm),&chi()); mult(&Uchi(),&Umu._odata[ssu](Tm),&chi());
accumReconTm(result,Uchi); accumReconTm(result,Uchi);
vstream(out._odata[ss],result); vstream(out._odata[ss],result);