diff --git a/Grid/lattice/Lattice_reduction.h b/Grid/lattice/Lattice_reduction.h index bcd09c04..5f73e94b 100644 --- a/Grid/lattice/Lattice_reduction.h +++ b/Grid/lattice/Lattice_reduction.h @@ -92,9 +92,7 @@ inline typename vobj::scalar_objectD sumD_cpu(const vobj *arg, Integer osites) ssum = ssum+sumarray[i]; } - typedef typename vobj::scalar_object ssobj; - ssobj ret = ssum; - return ret; + return ssum; } /* Threaded max, don't use for now diff --git a/Grid/lattice/Lattice_transfer.h b/Grid/lattice/Lattice_transfer.h index aee55e93..de6ca886 100644 --- a/Grid/lattice/Lattice_transfer.h +++ b/Grid/lattice/Lattice_transfer.h @@ -1080,6 +1080,25 @@ vectorizeFromRevLexOrdArray( std::vector &in, Lattice &out) }); } +template +void precisionChangeFast(Lattice &out, const Lattice &in) +{ + typedef typename VobjOut::scalar_object SobjOut; + typedef typename VobjIn::scalar_object SobjIn; + conformable(out.Grid(),in.Grid()); + out.Checkerboard() = in.Checkerboard(); + int nsimd = out.Grid()->Nsimd(); + autoView( out_v , out, AcceleratorWrite); + autoView( in_v , in, AcceleratorRead); + accelerator_for(idx,out.Grid()->oSites(),nsimd,{ + auto itmp = coalescedRead(in_v[idx]); + auto otmp = coalescedRead(out_v[idx]); +#ifdef GRID_SIMT + otmp=itmp; +#endif + coalescedWrite(out_v[idx],otmp); + }); +} //Convert a Lattice from one precision to another template void precisionChange(Lattice &out, const Lattice &in)