Apply clang-tidy-11 fixes to CUDA files

[alexxy/gromacs.git] / src / gromacs / ewald / pme_solve.cu
diff --git a/src/gromacs/ewald/pme_solve.cu b/src/gromacs/ewald/pme_solve.cu

index 3f5d2d06f45b5a0121562c1d69ef6b1d99258535..83e21b1f118a2e09dd2b31267c92ce978bc85b75 100644 (file)
--- a/src/gromacs/ewald/pme_solve.cu
+++ b/src/gromacs/ewald/pme_solve.cu
@@ -1,7 +1,7 @@
  /*
   * This file is part of the GROMACS molecular simulation package.
   *
- * Copyright (c) 2016,2017,2018,2019,2020, by the GROMACS development team, led by
+ * Copyright (c) 2016,2017,2018,2019,2020,2021, by the GROMACS development team, led by
   * Mark Abraham, David van der Spoel, Berk Hess, and Erik Lindahl,
   * and including many others, as listed in the AUTHORS file in the
   * top-level source directory and at http://www.gromacs.org.
@@ -88,7 +88,7 @@ __launch_bounds__(c_solveMaxThreadsPerBlock) CLANG_DISABLE_OPTIMIZATION_ATTRIBUT
      const float* __restrict__ gm_splineValueMinor = kernelParams.grid.d_splineModuli[gridIndex]
                                                      + kernelParams.grid.splineValuesOffset[minorDim];
      float* __restrict__ gm_virialAndEnergy = kernelParams.constants.d_virialAndEnergy[gridIndex];
-    float2* __restrict__ gm_grid           = (float2*)kernelParams.grid.d_fourierGrid[gridIndex];
+    float2* __restrict__ gm_grid = reinterpret_cast<float2*>(kernelParams.grid.d_fourierGrid[gridIndex]);
  
      /* Various grid sizes and indices */
      const int localOffsetMinor = 0, localOffsetMajor = 0, localOffsetMiddle = 0; // unused
@@ -119,13 +119,13 @@ __launch_bounds__(c_solveMaxThreadsPerBlock) CLANG_DISABLE_OPTIMIZATION_ATTRIBUT
      const int indexMajor        = blockIdx.z;
  
      /* Optional outputs */
-    float energy = 0.0f;
-    float virxx  = 0.0f;
-    float virxy  = 0.0f;
-    float virxz  = 0.0f;
-    float viryy  = 0.0f;
-    float viryz  = 0.0f;
-    float virzz  = 0.0f;
+    float energy = 0.0F;
+    float virxx  = 0.0F;
+    float virxy  = 0.0F;
+    float virxz  = 0.0F;
+    float viryy  = 0.0F;
+    float viryz  = 0.0F;
+    float virzz  = 0.0F;
  
      assert(indexMajor < kernelParams.grid.complexGridSize[majorDim]);
      if ((indexMiddle < localCountMiddle) & (indexMinor < localCountMinor)
@@ -176,20 +176,20 @@ __launch_bounds__(c_solveMaxThreadsPerBlock) CLANG_DISABLE_OPTIMIZATION_ATTRIBUT
          }
  
          /* 0.5 correction factor for the first and last components of a Z dimension */
-        float corner_fac = 1.0f;
+        float corner_fac = 1.0F;
          switch (gridOrdering)
          {
              case GridOrdering::YZX:
                  if ((kMiddle == 0) | (kMiddle == maxkMiddle))
                  {
-                    corner_fac = 0.5f;
+                    corner_fac = 0.5F;
                  }
                  break;
  
              case GridOrdering::XYZ:
                  if ((kMinor == 0) | (kMinor == maxkMinor))
                  {
-                    corner_fac = 0.5f;
+                    corner_fac = 0.5F;
                  }
                  break;
  
@@ -206,13 +206,13 @@ __launch_bounds__(c_solveMaxThreadsPerBlock) CLANG_DISABLE_OPTIMIZATION_ATTRIBUT
                                 + mZ * kernelParams.current.recipBox[ZZ][ZZ];
  
              const float m2k = mhxk * mhxk + mhyk * mhyk + mhzk * mhzk;
-            assert(m2k != 0.0f);
+            assert(m2k != 0.0F);
              // TODO: use LDG/textures for gm_splineValue
              float denom = m2k * float(CUDART_PI_F) * kernelParams.current.boxVolume
                            * gm_splineValueMajor[kMajor] * gm_splineValueMiddle[kMiddle]
                            * gm_splineValueMinor[kMinor];
              assert(isfinite(denom));
-            assert(denom != 0.0f);
+            assert(denom != 0.0F);
  
              const float tmp1   = expf(-kernelParams.grid.ewaldFactor * m2k);
              const float etermk = kernelParams.constants.elFactor * tmp1 / denom;
@@ -226,9 +226,9 @@ __launch_bounds__(c_solveMaxThreadsPerBlock) CLANG_DISABLE_OPTIMIZATION_ATTRIBUT
              if (computeEnergyAndVirial)
              {
                  const float tmp1k =
-                        2.0f * (gridValue.x * oldGridValue.x + gridValue.y * oldGridValue.y);
+                        2.0F * (gridValue.x * oldGridValue.x + gridValue.y * oldGridValue.y);
  
-                float vfactor = (kernelParams.grid.ewaldFactor + 1.0f / m2k) * 2.0f;
+                float vfactor = (kernelParams.grid.ewaldFactor + 1.0F / m2k) * 2.0F;
                  float ets2    = corner_fac * tmp1k;
                  energy        = ets2;
  
@@ -303,7 +303,7 @@ __launch_bounds__(c_solveMaxThreadsPerBlock) CLANG_DISABLE_OPTIMIZATION_ATTRIBUT
          /* Reduce 7 outputs per warp in the shared memory */
          const int stride =
                  8; // this is c_virialAndEnergyCount==7 rounded up to power of 2 for convenience, hence the assert
-        assert(c_virialAndEnergyCount == 7);
+        static_assert(c_virialAndEnergyCount == 7);
          const int        reductionBufferSize = (c_solveMaxThreadsPerBlock / warp_size) * stride;
          __shared__ float sm_virialAndEnergy[reductionBufferSize];