diff --git a/Grid/algorithms/iterative/ConjugateGradient.h b/Grid/algorithms/iterative/ConjugateGradient.h index e0fa7f83..3308d8fe 100644 --- a/Grid/algorithms/iterative/ConjugateGradient.h +++ b/Grid/algorithms/iterative/ConjugateGradient.h @@ -191,7 +191,7 @@ public: std::cout << GridLogMessage << "\tAxpyNorm " << AxpyNormTimer.Elapsed() < buffer(numBlocks); sobj *buffer_v = &buffer[0]; sobj result; - reduceKernel<<< numBlocks, numThreads, smemSize >>>(lat, buffer_v, size); + reduceKernel<<< numBlocks, numThreads, smemSize, computeStream >>>(lat, buffer_v, size); accelerator_barrier(); acceleratorCopyFromDevice(buffer_v,&result,sizeof(result)); #else Vector buffer(numBlocks); sobj *buffer_v = &buffer[0]; sobj result; - reduceKernel<<< numBlocks, numThreads, smemSize >>>(lat, buffer_v, size); + reduceKernel<<< numBlocks, numThreads, smemSize, computeStream >>>(lat, buffer_v, size); accelerator_barrier(); result = *buffer_v; #endif