From 64bf6fe54e1cea89d2c5c1d5976269ab44eefd5b Mon Sep 17 00:00:00 2001 From: Antonin Portelli Date: Wed, 4 May 2016 12:14:38 -0700 Subject: [PATCH 1/7] macro to dump NERSC header to a stream --- lib/parallelIO/NerscIO.h | 53 ++++++++++++++++++++-------------------- 1 file changed, 27 insertions(+), 26 deletions(-) diff --git a/lib/parallelIO/NerscIO.h b/lib/parallelIO/NerscIO.h index 9c280397..79572539 100644 --- a/lib/parallelIO/NerscIO.h +++ b/lib/parallelIO/NerscIO.h @@ -213,37 +213,38 @@ class NerscIO : public BinaryIO { static inline void truncate(std::string file){ std::ofstream fout(file,std::ios::out); } + + #define dump_nersc_header(field, s)\ + s << "BEGIN_HEADER" << std::endl;\ + s << "HDR_VERSION = " << field.hdr_version << std::endl;\ + s << "DATATYPE = " << field.data_type << std::endl;\ + s << "STORAGE_FORMAT = " << field.storage_format << std::endl;\ + for(int i=0;i<4;i++){\ + s << "DIMENSION_" << i+1 << " = " << field.dimension[i] << std::endl ;\ + }\ + s << "LINK_TRACE = " << std::setprecision(10) << field.link_trace << std::endl;\ + s << "PLAQUETTE = " << std::setprecision(10) << field.plaquette << std::endl;\ + for(int i=0;i<4;i++){\ + s << "BOUNDARY_"< Date: Wed, 4 May 2016 12:14:49 -0700 Subject: [PATCH 2/7] log polish --- lib/Log.h | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/lib/Log.h b/lib/Log.h index e55c2e52..70ccf6ed 100644 --- a/lib/Log.h +++ b/lib/Log.h @@ -69,10 +69,10 @@ public: StopWatch.Stop(); GridTime now = StopWatch.Elapsed(); StopWatch.Start(); - stream << BLACK<< log.topName << BLACK<< " : "; - stream << log.COLOUR < Date: Wed, 4 May 2016 12:15:31 -0700 Subject: [PATCH 3/7] LatticeBase contain the grid pointer and a virtual destructor to allow polymorphic lattice pointers --- lib/lattice/Lattice_base.h | 25 +++++++++++++++++-------- 1 file changed, 17 insertions(+), 8 deletions(-) diff --git a/lib/lattice/Lattice_base.h b/lib/lattice/Lattice_base.h index 8812a975..d97b1204 100644 --- a/lib/lattice/Lattice_base.h +++ b/lib/lattice/Lattice_base.h @@ -55,7 +55,13 @@ extern int GridCshiftPermuteMap[4][16]; // Basic expressions used in Expression Template //////////////////////////////////////////////// -class LatticeBase {}; +class LatticeBase +{ +public: + virtual ~LatticeBase(void) = default; + GridBase *_grid; +}; + class LatticeExpressionBase {}; template using Vector = std::vector >; // Aligned allocator?? @@ -88,8 +94,6 @@ template class Lattice : public LatticeBase { public: - - GridBase *_grid; int checkerboard; Vector _odata; @@ -177,8 +181,8 @@ PARALLEL_FOR_LOOP } //GridFromExpression is tricky to do template - Lattice(const LatticeUnaryExpression & expr): _grid(nullptr){ - + Lattice(const LatticeUnaryExpression & expr) { + _grid = nullptr; GridFromExpression(_grid,expr); assert(_grid!=nullptr); @@ -199,7 +203,8 @@ PARALLEL_FOR_LOOP } }; template - Lattice(const LatticeBinaryExpression & expr): _grid(nullptr){ + Lattice(const LatticeBinaryExpression & expr) { + _grid = nullptr; GridFromExpression(_grid,expr); assert(_grid!=nullptr); @@ -220,7 +225,8 @@ PARALLEL_FOR_LOOP } }; template - Lattice(const LatticeTrinaryExpression & expr): _grid(nullptr){ + Lattice(const LatticeTrinaryExpression & expr) { + _grid = nullptr; GridFromExpression(_grid,expr); assert(_grid!=nullptr); @@ -240,7 +246,8 @@ PARALLEL_FOR_LOOP // Constructor requires "grid" passed. // what about a default grid? ////////////////////////////////////////////////////////////////// - Lattice(GridBase *grid) : _grid(grid), _odata(_grid->oSites()) { + Lattice(GridBase *grid) : _odata(grid->oSites()) { + _grid = grid; // _odata.reserve(_grid->oSites()); // _odata.resize(_grid->oSites()); // std::cout << "Constructing lattice object with Grid pointer "<<_grid< strong_inline Lattice & operator = (const sobj & r){ PARALLEL_FOR_LOOP for(int ss=0;ss<_grid->oSites();ss++){ From 4bc21ec7cbc8162c9b65e9ff9eecc785aabffed0 Mon Sep 17 00:00:00 2001 From: Antonin Portelli Date: Wed, 11 May 2016 15:21:29 +0100 Subject: [PATCH 4/7] thread CL argument fix --- lib/Init.cc | 6 +++++- 1 file changed, 5 insertions(+), 1 deletion(-) diff --git a/lib/Init.cc b/lib/Init.cc index fd50c4d5..72d79905 100644 --- a/lib/Init.cc +++ b/lib/Init.cc @@ -144,6 +144,10 @@ void GridParseLayout(char **argv,int argc, } if( GridCmdOptionExists(argv,argv+argc,"--threads") ){ std::vector ompthreads(0); +#ifndef GRID_OMP + std::cout << GridLogWarning << "'--threads' option used but Grid was" + << " not compiled with thread support" << std::endl; +#endif arg= GridCmdOptionPayload(argv,argv+argc,"--threads"); GridCmdOptionIntVector(arg,ompthreads); assert(ompthreads.size()==1); @@ -187,7 +191,7 @@ void Grid_init(int *argc,char ***argv) std::cout< Date: Thu, 12 May 2016 13:01:35 +0100 Subject: [PATCH 5/7] const fix in slice functions --- lib/lattice/Lattice_transfer.h | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/lib/lattice/Lattice_transfer.h b/lib/lattice/Lattice_transfer.h index 178b5937..760f90ec 100644 --- a/lib/lattice/Lattice_transfer.h +++ b/lib/lattice/Lattice_transfer.h @@ -361,7 +361,7 @@ PARALLEL_FOR_LOOP template -void InsertSlice(const Lattice &lowDim,Lattice & higherDim,int slice, int orthog) +void InsertSlice(Lattice &lowDim,Lattice & higherDim,int slice, int orthog) { typedef typename vobj::scalar_object sobj; sobj s; @@ -404,7 +404,7 @@ PARALLEL_FOR_LOOP } template -void ExtractSlice(Lattice &lowDim,const Lattice & higherDim,int slice, int orthog) +void ExtractSlice(Lattice &lowDim, Lattice & higherDim,int slice, int orthog) { typedef typename vobj::scalar_object sobj; sobj s; From 3789e3f31ce639607225bfea2c0db70dfcec7361 Mon Sep 17 00:00:00 2001 From: Antonin Portelli Date: Thu, 12 May 2016 18:35:38 +0100 Subject: [PATCH 6/7] additional fixed in slice functions --- lib/lattice/Lattice_transfer.h | 12 ++++++------ 1 file changed, 6 insertions(+), 6 deletions(-) diff --git a/lib/lattice/Lattice_transfer.h b/lib/lattice/Lattice_transfer.h index 760f90ec..638563a9 100644 --- a/lib/lattice/Lattice_transfer.h +++ b/lib/lattice/Lattice_transfer.h @@ -374,7 +374,7 @@ void InsertSlice(Lattice &lowDim,Lattice & higherDim,int slice, int assert(nl+1 == nh); assert(orthog=0); - assert(hg->_processors[orthog]==0); + assert(hg->_processors[orthog]==1); int dl; dl = 0; for(int d=0;d &lowDim, Lattice & higherDim,int slice, in assert(nl+1 == nh); assert(orthog=0); - assert(hg->_processors[orthog]==0); + assert(hg->_processors[orthog]==1); int dl; dl = 0; for(int d=0;d Date: Thu, 12 May 2016 19:24:10 +0100 Subject: [PATCH 7/7] fix of the empty SIMD --- lib/simd/Grid_empty.h | 50 ++++++++++++++++++++++++++++++++++++++++++- 1 file changed, 49 insertions(+), 1 deletion(-) diff --git a/lib/simd/Grid_empty.h b/lib/simd/Grid_empty.h index 5ab75de7..46082130 100644 --- a/lib/simd/Grid_empty.h +++ b/lib/simd/Grid_empty.h @@ -377,7 +377,55 @@ namespace Optimization { template < typename vtype > void permute(vtype &a, vtype b, int perm) { - }; + }; + + struct Rotate{ + + static inline u128f rotate(u128f in,int n){ + u128f out; + switch(n){ + case 0: + out.f[0] = in.f[0]; + out.f[1] = in.f[1]; + out.f[2] = in.f[2]; + out.f[3] = in.f[3]; + break; + case 1: + out.f[0] = in.f[1]; + out.f[1] = in.f[2]; + out.f[2] = in.f[3]; + out.f[3] = in.f[0]; + break; + case 2: + out.f[0] = in.f[2]; + out.f[1] = in.f[3]; + out.f[2] = in.f[0]; + out.f[3] = in.f[1]; + break; + case 3: + out.f[0] = in.f[3]; + out.f[1] = in.f[0]; + out.f[2] = in.f[1]; + out.f[3] = in.f[2]; + break; + default: assert(0); + } + } + static inline u128d rotate(u128d in,int n){ + u128d out; + switch(n){ + case 0: + out.f[0] = in.f[0]; + out.f[1] = in.f[1]; + break; + case 1: + out.f[0] = in.f[1]; + out.f[1] = in.f[0]; + break; + default: assert(0); + } + } + }; //Complex float Reduce template<>