diff --git a/Grid/qcd/action/fermion/WilsonCompressor.h b/Grid/qcd/action/fermion/WilsonCompressor.h index 605bdcec..1c6571e1 100644 --- a/Grid/qcd/action/fermion/WilsonCompressor.h +++ b/Grid/qcd/action/fermion/WilsonCompressor.h @@ -484,6 +484,12 @@ public: this->face_table_computed=1; assert(this->u_comm_offset==this->_unified_buffer_size); accelerator_barrier(); +#ifdef NVLINK_GET + #warning "NVLINK_GET" + this->_grid->StencilBarrier(); // He can now get my local gather, I can get his + // Sync shared memory on a single node; could use an asynchronous barrier here and defer the check + // Or issue barrier AFTER the DMA is running +#endif } };