1
0
mirror of https://github.com/paboyle/Grid.git synced 2025-12-21 21:24:30 +00:00

Hand unrolled version of dslash in a separate class.

Useful for comparison: raises the Intel compiler from 9 GFlop/s to 17.5 GFlop/s
                   on an Ivy Bridge core. Raises Clang from 14.5 to 17.5 GFlop/s.
This commit is contained in:
Peter Boyle
2015-05-26 19:54:03 +01:00
parent c2ffb1a098
commit 20100d0a40
9 changed files with 157 additions and 370 deletions

View File

@@ -3,16 +3,11 @@
namespace Grid {
template<class obj1,class obj2>
void conformable(const Lattice<obj1> &lhs,const Lattice<obj2> &rhs)
template<class obj1,class obj2> void conformable(const Lattice<obj1> &lhs,const Lattice<obj2> &rhs)
{
assert(lhs._grid == rhs._grid);
assert(lhs.checkerboard == rhs.checkerboard);
}
// Conformability check for two grids: asserts that both pointers are equal.
// Both parameters are pointer-to-const because the function only compares
// the addresses and never touches the pointees; this lets callers that hold
// a `const GridBase *` on either side use the check.
inline void conformable(const GridBase *lhs,const GridBase *rhs)
{
  assert(lhs == rhs);
}
}
#endif