From 6fdefe5b90de26529b3bdbd3c0820a09fd7a0a0f Mon Sep 17 00:00:00 2001 From: Peter Boyle Date: Wed, 12 Feb 2025 14:55:20 +0000 Subject: [PATCH] Barrier sequencing if doing "GET" not "PUT" is different. This is somewhat better timing for Barriers --- Grid/qcd/action/fermion/WilsonCompressor.h | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/Grid/qcd/action/fermion/WilsonCompressor.h b/Grid/qcd/action/fermion/WilsonCompressor.h index 605bdcec..1c6571e1 100644 --- a/Grid/qcd/action/fermion/WilsonCompressor.h +++ b/Grid/qcd/action/fermion/WilsonCompressor.h @@ -484,6 +484,12 @@ public: this->face_table_computed=1; assert(this->u_comm_offset==this->_unified_buffer_size); accelerator_barrier(); +#ifdef NVLINK_GET + #warning "NVLINK_GET" + this->_grid->StencilBarrier(); // He can now get my local gather, I can get his + // Synch shared memory on a single node; could use an asynchronous barrier here and defer check + // Or issue barrier AFTER the DMA is running +#endif } };