Fix CUDA inter-stream synchronization issue

[alexxy/gromacs.git] / src / mdlib / nbnxn_cuda / nbnxn_cuda_types.h
diff --git a/src/mdlib/nbnxn_cuda/nbnxn_cuda_types.h b/src/mdlib/nbnxn_cuda/nbnxn_cuda_types.h

index 53cebe4f258aabcb20322461205e6ef2ed013baf..a5cbdc094677d2c085e4237e0760bc649c0c7aef 100644 (file)
--- a/src/mdlib/nbnxn_cuda/nbnxn_cuda_types.h
+++ b/src/mdlib/nbnxn_cuda/nbnxn_cuda_types.h
@@ -199,7 +199,7 @@ struct nbnxn_cuda
      cudaStream_t     stream[2];      /* local and non-local GPU streams                      */
  
      /* events used for synchronization */
-    cudaEvent_t    nonlocal_done, misc_ops_done;
+    cudaEvent_t    nonlocal_done, misc_ops_and_local_H2D_done;
  
      /* NOTE: With current CUDA versions (<=5.0) timing doesn't work with multiple
       * concurrent streams, so we won't time if both l/nl work is done on GPUs.