mirror of
https://github.com/paboyle/Grid.git
synced 2024-11-09 23:45:36 +00:00
sliceSumReduction_cub_large now also faster than CPU on Frontier
This commit is contained in:
parent
e0d5e3c6c7
commit
15878f7613
@@ -119,7 +119,7 @@ template<class vobj> inline void sliceSumReduction_cub_large(const vobj *Data, V
|
||||
typedef typename vobj::vector_type vector;
|
||||
const int words = sizeof(vobj)/sizeof(vector);
|
||||
const int osites = rd*e1*e2;
|
||||
-Vector<vector>buffer(osites);
|
||||
+commVector<vector>buffer(osites);
|
||||
vector *dat = (vector *)Data;
|
||||
vector *buf = &buffer[0];
|
||||
Vector<vector> lvSum_small(rd);
|
||||
|
@@ -105,6 +105,8 @@ int main (int argc, char ** argv) {
|
||||
|
||||
int trace_id = traceStart("sliceSum benchmark - ComplexD");
|
||||
std::cout << GridLogMessage << "Testing ComplexD" << std::endl;
|
||||
+std::cout << GridLogMessage << "sizeof(ComplexD) = " << sizeof(ComplexD) << std::endl;
|
||||
+std::cout << GridLogMessage << "sizeof(vComplexD) = " << sizeof(vComplexD) << std::endl;
|
||||
for (int i = 0; i < Nd; i++) {
|
||||
|
||||
RealD t=-usecond();
|
||||
@@ -258,4 +260,4 @@ int main (int argc, char ** argv) {
|
||||
|
||||
Grid_finalize();
|
||||
return 0;
|
||||
-}
|
||||
+}
|
||||
|
Loading…
Reference in New Issue
Block a user