Fix minor CUDA NB kernel performance regression

author Szilard Pall <pall.szilard@gmail.com>

Wed, 17 Jun 2015 22:59:57 +0000 (00:59 +0200)

committer Szilard Pall <pall.szilard@gmail.com>

Wed, 17 Jun 2015 23:11:04 +0000 (01:11 +0200)
author Szilard Pall <pall.szilard@gmail.com>
Wed, 17 Jun 2015 22:59:57 +0000 (00:59 +0200)
committer Szilard Pall <pall.szilard@gmail.com>
Wed, 17 Jun 2015 23:11:04 +0000 (01:11 +0200)
diff --git a/src/gromacs/mdlib/nbnxn_cuda/nbnxn_cuda_kernel.cuh b/src/gromacs/mdlib/nbnxn_cuda/nbnxn_cuda_kernel.cuh

index ef6fad72c1c55812c466f94ac10d67e4390afa64..b24915c1f922cefed0f1f0b9b48969e74c167600 100644 (file)
--- a/src/gromacs/mdlib/nbnxn_cuda/nbnxn_cuda_kernel.cuh
+++ b/src/gromacs/mdlib/nbnxn_cuda/nbnxn_cuda_kernel.cuh
@@ -160,7 +160,11 @@ __global__ void NB_KERNEL_FUNC_NAME(nbnxn_kernel, _F_cuda)
      unsigned int tidxi  = threadIdx.x;
      unsigned int tidxj  = threadIdx.y;
      unsigned int tidx   = threadIdx.y * blockDim.x + threadIdx.x;
+#if NTHREAD_Z == 1
+    unsigned int tidxz  = 0;
+#else
      unsigned int tidxz  = threadIdx.z;
+#endif
      unsigned int bidx   = blockIdx.x;
      unsigned int widx   = tidx / WARP_SIZE; /* warp index */
author	Szilard Pall <pall.szilard@gmail.com>
	Wed, 17 Jun 2015 22:59:57 +0000 (00:59 +0200)
committer	Szilard Pall <pall.szilard@gmail.com>
	Wed, 17 Jun 2015 23:11:04 +0000 (01:11 +0200)