From 5e48b701ecaa6e9cf184841f0c79aeaf4def1237 Mon Sep 17 00:00:00 2001 From: paboyle Date: Sat, 13 Jan 2018 00:11:53 +0000 Subject: [PATCH] FOrmatting --- lib/stencil/Lebesgue.cc | 48 ++++++++++++------------- lib/stencil/Lebesgue.h | 72 ++++++++++++++++++------------------- lib/stencil/Stencil.cc | 30 ++++++++-------- lib/stencil/Stencil.h | 78 ++++++++++++++++++++--------------------- 4 files changed, 114 insertions(+), 114 deletions(-) diff --git a/lib/stencil/Lebesgue.cc b/lib/stencil/Lebesgue.cc index bd8ed3ad..c6d7369e 100644 --- a/lib/stencil/Lebesgue.cc +++ b/lib/stencil/Lebesgue.cc @@ -1,4 +1,4 @@ - /************************************************************************************* +/************************************************************************************* Grid physics library, www.github.com/paboyle/Grid @@ -24,8 +24,8 @@ Author: paboyle 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. See the full license in the file "LICENSE" in the top level distribution directory - *************************************************************************************/ - /* END LEGAL */ +*************************************************************************************/ +/* END LEGAL */ #include #include @@ -72,9 +72,9 @@ void LebesgueOrder::ThreadInterleave(void) for(int t=0;t> blockbits) % threads == t ) { - throrder.push_back(reorder[ss]); - } + if ( ( ss >> blockbits) % threads == t ) { + throrder.push_back(reorder[ss]); + } } } _LebesgueReorder = throrder; @@ -112,9 +112,9 @@ void LebesgueOrder::CartesianBlocking(void) }; void LebesgueOrder::IterateO(int ND,int dim, - std::vector & xo, - std::vector & xi, - std::vector &dims) + std::vector & xo, + std::vector & xi, + std::vector &dims) { for(xo[dim]=0;xo[dim] 0 ) { @@ -126,10 +126,10 @@ void LebesgueOrder::IterateO(int ND,int dim, }; void LebesgueOrder::IterateI(int ND, - int dim, - std::vector & xo, - std::vector & xi, - std::vector &dims) + int dim, + std::vector & xo, + std::vector & xi, + std::vector &dims) { std::vector x(ND); for(xi[dim]=0;xi[dim]_rdimensions); _LebesgueReorder.push_back(index); @@ -227,16 +227,16 @@ void LebesgueOrder::ZGraph(void) assert( _LebesgueReorder.size() == vol ); /* - std::vector coor(4); - for(IndexInteger asite=0;asite coor(4); + for(IndexInteger asite=0;asiteoCoorFromOindex (coor,_LebesgueReorder[asite]); - std::cout << " site "<" << _LebesgueReorder[asite]<< " = [" - << coor[0]<<"," - << coor[1]<<"," - << coor[2]<<"," - << coor[3]<<"]" - <" << _LebesgueReorder[asite]<< " = [" + << coor[0]<<"," + << coor[1]<<"," + << coor[2]<<"," + << coor[3]<<"]" + < 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. See the full license in the file "LICENSE" in the top level distribution directory - *************************************************************************************/ - /* END LEGAL */ +*************************************************************************************/ +/* END LEGAL */ #ifndef GRID_LEBESGUE_H #define GRID_LEBESGUE_H @@ -34,48 +34,48 @@ Author: paboyle // Lebesgue, Morton, Z-graph ordering assistance NAMESPACE_BEGIN(Grid); - class LebesgueOrder { - public: +class LebesgueOrder { +public: - typedef int32_t IndexInteger; + typedef int32_t IndexInteger; - static int UseLebesgueOrder; - GridBase *grid; + static int UseLebesgueOrder; + GridBase *grid; - public: - LebesgueOrder(GridBase *_grid); +public: + LebesgueOrder(GridBase *_grid); - inline IndexInteger Reorder(IndexInteger ss) { - return _LebesgueReorder[ss] ; - }; + inline IndexInteger Reorder(IndexInteger ss) { + return _LebesgueReorder[ss] ; + }; - //////////////////////////// - // Space filling fractal for cache oblivious - //////////////////////////// - void ZGraph(void); - IndexInteger alignup(IndexInteger n); + //////////////////////////// + // Space filling fractal for cache oblivious + //////////////////////////// + void ZGraph(void); + IndexInteger alignup(IndexInteger n); - ///////////////////////////////// - // Cartesian stencil blocking strategy - ///////////////////////////////// - static std::vector Block; - void NoBlocking(void); - void CartesianBlocking(void); - void IterateO(int ND,int dim, - std::vector & xo, - std::vector & xi, - std::vector &dims); - void IterateI(int ND,int dim, - std::vector & xo, - std::vector & xi, - std::vector &dims); + ///////////////////////////////// + // Cartesian stencil blocking strategy + ///////////////////////////////// + static std::vector Block; + void NoBlocking(void); + void CartesianBlocking(void); + void IterateO(int ND,int dim, + std::vector & xo, + std::vector & xi, + std::vector &dims); + void IterateI(int ND,int dim, + std::vector & xo, + std::vector & xi, + std::vector &dims); - void ThreadInterleave(void); + void ThreadInterleave(void); - private: - std::vector _LebesgueReorder; +private: + std::vector _LebesgueReorder; - }; +}; NAMESPACE_END(Grid); diff --git a/lib/stencil/Stencil.cc b/lib/stencil/Stencil.cc index 9cd6a9ab..c1b33baa 100644 --- a/lib/stencil/Stencil.cc +++ b/lib/stencil/Stencil.cc @@ -1,4 +1,4 @@ - /************************************************************************************* +/************************************************************************************* Grid physics library, www.github.com/paboyle/Grid @@ -23,14 +23,14 @@ 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. See the full license in the file "LICENSE" in the top level distribution directory - *************************************************************************************/ - /* END LEGAL */ +*************************************************************************************/ +/* END LEGAL */ #include NAMESPACE_BEGIN(Grid); void Gather_plane_table_compute (GridBase *grid,int dimension,int plane,int cbmask, - int off,std::vector > & table) + int off,std::vector > & table) { table.resize(0); @@ -52,17 +52,17 @@ void Gather_plane_table_compute (GridBase *grid,int dimension,int plane,int cbma } } } else { - int bo=0; - table.resize(e1*e2/2); - for(int n=0;nCheckerBoardFromOindexTable(o+b); - if ( ocb &cbmask ) { - table[bo]=std::pair(bo,o+b); bo++; - } - } - } + int bo=0; + table.resize(e1*e2/2); + for(int n=0;nCheckerBoardFromOindexTable(o+b); + if ( ocb &cbmask ) { + table[bo]=std::pair(bo,o+b); bo++; + } + } + } } } diff --git a/lib/stencil/Stencil.h b/lib/stencil/Stencil.h index ef35e100..aeadd4b9 100644 --- a/lib/stencil/Stencil.h +++ b/lib/stencil/Stencil.h @@ -23,30 +23,30 @@ 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. See the full license in the file "LICENSE" in the top level distribution directory - *************************************************************************************/ - /* END LEGAL */ +*************************************************************************************/ +/* END LEGAL */ #ifndef GRID_STENCIL_H #define GRID_STENCIL_H #include // subdir aggregate #include // subdir aggregate - ////////////////////////////////////////////////////////////////////////////////////////// - // Must not lose sight that goal is to be able to construct really efficient - // gather to a point stencil code. CSHIFT is not the best way, so need - // additional stencil support. - // - // Stencil based code will exchange haloes and use a table lookup for neighbours. - // This will be done with generality to allow easier efficient implementations. - // Overlap of comms and compute is enabled by tabulating off-node connected, - // - // Generic services - // 0) Prebuild neighbour tables - // 1) Compute sizes of all haloes/comms buffers; allocate them. - // 2) Gather all faces, and communicate. - // 3) Loop over result sites, giving nbr index/offnode info for each - // - ////////////////////////////////////////////////////////////////////////////////////////// +////////////////////////////////////////////////////////////////////////////////////////// +// Must not lose sight that goal is to be able to construct really efficient +// gather to a point stencil code. CSHIFT is not the best way, so need +// additional stencil support. +// +// Stencil based code will exchange haloes and use a table lookup for neighbours. +// This will be done with generality to allow easier efficient implementations. +// Overlap of comms and compute is enabled by tabulating off-node connected, +// +// Generic services +// 0) Prebuild neighbour tables +// 1) Compute sizes of all haloes/comms buffers; allocate them. +// 2) Gather all faces, and communicate. +// 3) Loop over result sites, giving nbr index/offnode info for each +// +////////////////////////////////////////////////////////////////////////////////////////// NAMESPACE_BEGIN(Grid); @@ -54,7 +54,7 @@ NAMESPACE_BEGIN(Grid); // Gather for when there *is* need to SIMD split with compression /////////////////////////////////////////////////////////////////// void Gather_plane_table_compute (GridBase *grid,int dimension,int plane,int cbmask, - int off,std::vector > & table); + int off,std::vector > & table); template void Gather_plane_simple_table (std::vector >& table,const Lattice &rhs,cobj *buffer,compressor &compress, int off,int so) __attribute__((noinline)); @@ -89,21 +89,21 @@ void Gather_plane_exchange_table(std::vector >& table,const L } } - struct StencilEntry { - uint64_t _offset; - uint64_t _byte_offset; - uint16_t _is_local; - uint16_t _permute; - uint16_t _around_the_world; //256 bits, 32 bytes, 1/2 cacheline - uint16_t _pad; - }; +struct StencilEntry { + uint64_t _offset; + uint64_t _byte_offset; + uint16_t _is_local; + uint16_t _permute; + uint16_t _around_the_world; //256 bits, 32 bytes, 1/2 cacheline + uint16_t _pad; +}; //////////////////////////////////////// // The Stencil Class itself //////////////////////////////////////// template class CartesianStencil { // Stencil runs along coordinate axes only; NO diagonal fill in. - public: +public: typedef typename cobj::vector_type vector_type; typedef typename cobj::scalar_type scalar_type; @@ -538,17 +538,17 @@ class CartesianStencil { // Stencil runs along coordinate axes only; NO diagonal } }; - CartesianStencil(GridBase *grid, - int npoints, - int checkerboard, - const std::vector &directions, - const std::vector &distances) - : _permute_type(npoints), - _comm_buf_size(npoints), - comm_bytes_thr(npoints), - comm_enter_thr(npoints), - comm_leave_thr(npoints), - comm_time_thr(npoints) + CartesianStencil(GridBase *grid, + int npoints, + int checkerboard, + const std::vector &directions, + const std::vector &distances) + : _permute_type(npoints), + _comm_buf_size(npoints), + comm_bytes_thr(npoints), + comm_enter_thr(npoints), + comm_leave_thr(npoints), + comm_time_thr(npoints) { face_table_computed=0; _npoints = npoints;