/*
* This file is part of the GROMACS molecular simulation package.
*
 * Copyright (c) 2018,2019,2020,2021, by the GROMACS development team, led by
* Mark Abraham, David van der Spoel, Berk Hess, and Erik Lindahl,
* and including many others, as listed in the AUTHORS file in the
* top-level source directory and at http://www.gromacs.org.
#include "gmxpre.h"
+#include "gromacs/utility/arrayref.h"
#include "partition.h"
#include "config.h"
#include "gromacs/domdec/collect.h"
#include "gromacs/domdec/dlb.h"
#include "gromacs/domdec/dlbtiming.h"
-#include "gromacs/domdec/domdec.h"
#include "gromacs/domdec/domdec_network.h"
#include "gromacs/domdec/ga2la.h"
#include "gromacs/domdec/localatomsetmanager.h"
+#include "gromacs/domdec/localtopology.h"
+#include "gromacs/domdec/localtopologychecker.h"
#include "gromacs/domdec/mdsetup.h"
-#include "gromacs/ewald/pme.h"
-#include "gromacs/gmxlib/chargegroup.h"
+#include "gromacs/domdec/nsgrid.h"
+#include "gromacs/ewald/pme_pp.h"
#include "gromacs/gmxlib/network.h"
#include "gromacs/gmxlib/nrnb.h"
#include "gromacs/imd/imd.h"
#include "gromacs/mdlib/forcerec.h"
#include "gromacs/mdlib/gmx_omp_nthreads.h"
#include "gromacs/mdlib/mdatoms.h"
-#include "gromacs/mdlib/nsgrid.h"
#include "gromacs/mdlib/vsite.h"
#include "gromacs/mdtypes/commrec.h"
#include "gromacs/mdtypes/forcerec.h"
#include "gromacs/mdtypes/inputrec.h"
#include "gromacs/mdtypes/md_enums.h"
+#include "gromacs/mdtypes/mdatom.h"
#include "gromacs/mdtypes/nblist.h"
#include "gromacs/mdtypes/state.h"
#include "gromacs/nbnxm/nbnxm.h"
* There is a bit of overhead with DLB and it's difficult to achieve
* a load imbalance of less than 2% with DLB.
*/
/* Stray diff markers resolved to the reformatted definitions. */
#define DD_PERF_LOSS_DLB_ON 0.02
//! Warn about imbalance due to PP or PP/PME load imbalance at this loss.
#define DD_PERF_LOSS_WARN 0.05
//! Debug helper printing a DD zone
-static void print_ddzone(FILE *fp, int d, int i, int j, gmx_ddzone_t *zone)
+static void print_ddzone(FILE* fp, int d, int i, int j, gmx_ddzone_t* zone)
{
- fprintf(fp, "zone d0 %d d1 %d d2 %d min0 %6.3f max1 %6.3f mch0 %6.3f mch1 %6.3f p1_0 %6.3f p1_1 %6.3f\n",
- d, i, j,
- zone->min0, zone->max1,
- zone->mch0, zone->mch0,
- zone->p1_0, zone->p1_1);
+ fprintf(fp,
+ "zone d0 %d d1 %d d2 %d min0 %6.3f max1 %6.3f mch0 %6.3f mch1 %6.3f p1_0 %6.3f p1_1 "
+ "%6.3f\n",
+ d,
+ i,
+ j,
+ zone->min0,
+ zone->max1,
+ zone->mch0,
+ zone->mch0,
+ zone->p1_0,
+ zone->p1_1);
}
/*! \brief Using the home grid size as input in cell_ns_x0 and cell_ns_x1
* and returns the results in cell_ns_x0 and cell_ns_x1.
* Note: only used with the group cut-off scheme.
*/
-static void dd_move_cellx(gmx_domdec_t *dd,
- const gmx_ddbox_t *ddbox,
- rvec cell_ns_x0,
- rvec cell_ns_x1)
+static void dd_move_cellx(gmx_domdec_t* dd, const gmx_ddbox_t* ddbox, rvec cell_ns_x0, rvec cell_ns_x1)
{
constexpr int c_ddZoneCommMaxNumZones = 5;
gmx_ddzone_t buf_s[c_ddZoneCommMaxNumZones];
gmx_ddzone_t buf_r[c_ddZoneCommMaxNumZones];
gmx_ddzone_t buf_e[c_ddZoneCommMaxNumZones];
- gmx_domdec_comm_t *comm = dd->comm;
+ gmx_domdec_comm_t* comm = dd->comm;
- rvec extr_s[2];
- rvec extr_r[2];
+ rvec extr_s[2];
+ rvec extr_r[2];
for (int d = 1; d < dd->ndim; d++)
{
int dim = dd->dim[d];
- gmx_ddzone_t &zp = (d == 1) ? comm->zone_d1[0] : comm->zone_d2[0][0];
+ gmx_ddzone_t& zp = (d == 1) ? comm->zone_d1[0] : comm->zone_d2[0][0];
/* Copy the base sizes of the home zone */
zp.min0 = cell_ns_x0[dim];
/* Store the extremes in the backward sending buffer,
* so they get updated separately from the forward communication.
*/
- for (int d1 = d; d1 < dd->ndim-1; d1++)
+ for (int d1 = d; d1 < dd->ndim - 1; d1++)
{
- gmx_ddzone_t &buf = buf_s[pos];
+ gmx_ddzone_t& buf = buf_s[pos];
/* We invert the order to be able to use the same loop for buf_e */
- buf.min0 = extr_s[d1][1];
- buf.max1 = extr_s[d1][0];
- buf.min1 = extr_s[d1][2];
- buf.mch0 = 0;
- buf.mch1 = 0;
+ buf.min0 = extr_s[d1][1];
+ buf.max1 = extr_s[d1][0];
+ buf.min1 = extr_s[d1][2];
+ buf.mch0 = 0;
+ buf.mch1 = 0;
/* Store the cell corner of the dimension we communicate along */
buf.p1_0 = comm->cell_x0[dim];
buf.p1_1 = 0;
if (applyPbc)
{
/* Take the minimum to avoid double communication */
- numPulsesMin = std::min(numPulses, dd->nc[dim] - 1 - numPulses);
+ numPulsesMin = std::min(numPulses, dd->numCells[dim] - 1 - numPulses);
}
else
{
/* Communicate the extremes forward */
bool receiveValidData = (applyPbc || dd->ci[dim] > 0);
- int numElements = dd->ndim - d - 1;
- ddSendrecv(dd, d, dddirForward,
- extr_s + d, numElements,
- extr_r + d, numElements);
+ int numElements = dd->ndim - d - 1;
+ ddSendrecv(dd, d, dddirForward, extr_s + d, numElements, extr_r + d, numElements);
if (receiveValidData)
{
for (int pulse = 0; pulse < numPulses; pulse++)
{
/* Communicate all the zone information backward */
- bool receiveValidData = (applyPbc || dd->ci[dim] < dd->nc[dim] - 1);
+ bool receiveValidData = (applyPbc || dd->ci[dim] < dd->numCells[dim] - 1);
- static_assert(sizeof(gmx_ddzone_t) == c_ddzoneNumReals*sizeof(real), "Here we expect gmx_ddzone_t to consist of c_ddzoneNumReals reals (only)");
+ static_assert(
+ sizeof(gmx_ddzone_t) == c_ddzoneNumReals * sizeof(real),
+ "Here we expect gmx_ddzone_t to consist of c_ddzoneNumReals reals (only)");
- int numReals = numElementsInBuffer*c_ddzoneNumReals;
- ddSendrecv(dd, d, dddirBackward,
+ int numReals = numElementsInBuffer * c_ddzoneNumReals;
+ ddSendrecv(dd,
+ d,
+ dddirBackward,
gmx::arrayRefFromArray(&buf_s[0].min0, numReals),
gmx::arrayRefFromArray(&buf_r[0].min0, numReals));
{
c = 0;
}
- real det = (1 + c*c)*gmx::square(comm->systemInfo.cutoff) - dist_d*dist_d;
+ real det = (1 + c * c) * gmx::square(comm->systemInfo.cutoff) - dist_d * dist_d;
if (det > 0)
{
- dh[d1] = comm->systemInfo.cutoff - (c*dist_d + std::sqrt(det))/(1 + c*c);
+ dh[d1] = comm->systemInfo.cutoff - (c * dist_d + std::sqrt(det)) / (1 + c * c);
}
else
{
}
if (receiveValidData && dh[d1] >= 0)
{
- buf_e[i].mch0 = std::max(buf_e[i].mch0, buf_r[i].mch0-dh[d1]);
- buf_e[i].mch1 = std::max(buf_e[i].mch1, buf_r[i].mch1-dh[d1]);
+ buf_e[i].mch0 = std::max(buf_e[i].mch0, buf_r[i].mch0 - dh[d1]);
+ buf_e[i].mch1 = std::max(buf_e[i].mch1, buf_r[i].mch1 - dh[d1]);
}
}
/* Copy the received buffer to the send buffer,
*/
buf_s[i] = buf_r[i];
}
- if (((applyPbc || dd->ci[dim] + numPulses < dd->nc[dim]) && pulse == numPulses - 1) ||
- (!applyPbc && dd->ci[dim] + 1 + pulse == dd->nc[dim] - 1))
+ if (((applyPbc || dd->ci[dim] + numPulses < dd->numCells[dim]) && pulse == numPulses - 1)
+ || (!applyPbc && dd->ci[dim] + 1 + pulse == dd->numCells[dim] - 1))
{
/* Store the extremes */
int pos = 0;
- for (int d1 = d; d1 < dd->ndim-1; d1++)
+ for (int d1 = d; d1 < dd->ndim - 1; d1++)
{
extr_s[d1][1] = std::min(extr_s[d1][1], buf_e[pos].min0);
extr_s[d1][0] = std::max(extr_s[d1][0], buf_e[pos].max1);
{
for (int i = d; i < 2; i++)
{
- comm->zone_d2[1-d][i] = buf_e[pos];
+ comm->zone_d2[1 - d][i] = buf_e[pos];
pos++;
}
}
}
for (int d = 1; d < dd->ndim; d++)
{
- cellsizes[d].fracLowerMax = extr_s[d-1][0];
- cellsizes[d].fracUpperMin = extr_s[d-1][1];
+ cellsizes[d].fracLowerMax = extr_s[d - 1][0];
+ cellsizes[d].fracUpperMin = extr_s[d - 1][1];
if (debug)
{
- fprintf(debug, "Cell fraction d %d, max0 %f, min1 %f\n",
- d, cellsizes[d].fracLowerMax, cellsizes[d].fracUpperMin);
+ fprintf(debug,
+ "Cell fraction d %d, max0 %f, min1 %f\n",
+ d,
+ cellsizes[d].fracLowerMax,
+ cellsizes[d].fracUpperMin);
}
}
}
//! Sets the charge-group zones to be equal to the home zone.
-static void set_zones_ncg_home(gmx_domdec_t *dd)
+static void set_zones_numHomeAtoms(gmx_domdec_t* dd)
{
- gmx_domdec_zones_t *zones;
+ gmx_domdec_zones_t* zones;
int i;
zones = &dd->comm->zones;
zones->cg_range[0] = 0;
- for (i = 1; i < zones->n+1; i++)
+ for (i = 1; i < zones->n + 1; i++)
{
- zones->cg_range[i] = dd->ncg_home;
+ zones->cg_range[i] = dd->numHomeAtoms;
}
- /* zone_ncg1[0] should always be equal to ncg_home */
- dd->comm->zone_ncg1[0] = dd->ncg_home;
+ /* zone_ncg1[0] should always be equal to numHomeAtoms */
+ dd->comm->zone_ncg1[0] = dd->numHomeAtoms;
}
//! Restore atom groups for the charge groups.
-static void restoreAtomGroups(gmx_domdec_t *dd,
- const t_state *state)
+static void restoreAtomGroups(gmx_domdec_t* dd, const t_state* state)
{
- gmx::ArrayRef<const int> atomGroupsState = state->cg_gl;
+ gmx::ArrayRef<const int> atomGroupsState = state->cg_gl;
- std::vector<int> &globalAtomGroupIndices = dd->globalAtomGroupIndices;
+ std::vector<int>& globalAtomGroupIndices = dd->globalAtomGroupIndices;
globalAtomGroupIndices.resize(atomGroupsState.size());
globalAtomGroupIndices[i] = atomGroupsState[i];
}
- dd->ncg_home = atomGroupsState.size();
+ dd->numHomeAtoms = atomGroupsState.size();
dd->comm->atomRanges.setEnd(DDAtomRanges::Type::Home, atomGroupsState.ssize());
- set_zones_ncg_home(dd);
+ set_zones_numHomeAtoms(dd);
}
-//! Sets the cginfo structures.
-static void dd_set_cginfo(gmx::ArrayRef<const int> index_gl, int cg0, int cg1,
- t_forcerec *fr, char *bLocalCG)
+//! Sets the atom info structures.
+static void dd_set_atominfo(gmx::ArrayRef<const int> index_gl, int cg0, int cg1, t_forcerec* fr)
{
if (fr != nullptr)
{
- const cginfo_mb_t *cginfo_mb = fr->cginfo_mb;
- gmx::ArrayRef<int> cginfo = fr->cginfo;
-
- for (int cg = cg0; cg < cg1; cg++)
- {
- cginfo[cg] = ddcginfo(cginfo_mb, index_gl[cg]);
- }
- }
+ gmx::ArrayRef<gmx::AtomInfoWithinMoleculeBlock> atomInfoForEachMoleculeBlock =
+ fr->atomInfoForEachMoleculeBlock;
+ gmx::ArrayRef<int64_t> atomInfo = fr->atomInfo;
- if (bLocalCG != nullptr)
- {
for (int cg = cg0; cg < cg1; cg++)
{
- bLocalCG[index_gl[cg]] = TRUE;
+ atomInfo[cg] = ddGetAtomInfo(atomInfoForEachMoleculeBlock, index_gl[cg]);
}
}
}
//! Makes the mappings between global and local atom indices during DD repartioning.
-static void make_dd_indices(gmx_domdec_t *dd,
- const int atomStart)
+static void make_dd_indices(gmx_domdec_t* dd, const int atomStart)
{
- const int numZones = dd->comm->zones.n;
- const int *zone2cg = dd->comm->zones.cg_range;
- const int *zone_ncg1 = dd->comm->zone_ncg1;
- gmx::ArrayRef<const int> globalAtomGroupIndices = dd->globalAtomGroupIndices;
+ const int numZones = dd->comm->zones.n;
+ gmx::ArrayRef<const int> zone2cg = dd->comm->zones.cg_range;
+ gmx::ArrayRef<const int> zone_ncg1 = dd->comm->zone_ncg1;
+ gmx::ArrayRef<const int> globalAtomGroupIndices = dd->globalAtomGroupIndices;
- std::vector<int> &globalAtomIndices = dd->globalAtomIndices;
- gmx_ga2la_t &ga2la = *dd->ga2la;
+ std::vector<int>& globalAtomIndices = dd->globalAtomIndices;
+ gmx_ga2la_t& ga2la = *dd->ga2la;
- if (zone2cg[1] != dd->ncg_home)
+ if (zone2cg[1] != dd->numHomeAtoms)
{
gmx_incons("dd->ncg_zone is not up to date");
}
{
cg0 = zone2cg[zone];
}
- int cg1 = zone2cg[zone+1];
+ int cg1 = zone2cg[zone + 1];
int cg1_p1 = cg0 + zone_ncg1[zone];
for (int cg = cg0; cg < cg1; cg++)
}
int cg_gl = globalAtomGroupIndices[cg];
globalAtomIndices.push_back(cg_gl);
- ga2la.insert(cg_gl, {a, zone1});
+ ga2la.insert(cg_gl, { a, zone1 });
a++;
}
}
}
-//! Checks the charge-group assignements.
-static int check_bLocalCG(gmx_domdec_t *dd, int ncg_sys, const char *bLocalCG,
- const char *where)
-{
- int nerr = 0;
- if (bLocalCG == nullptr)
- {
- return nerr;
- }
- for (size_t i = 0; i < dd->globalAtomGroupIndices.size(); i++)
- {
- if (!bLocalCG[dd->globalAtomGroupIndices[i]])
- {
- fprintf(stderr,
- "DD rank %d, %s: atom group %zu, global atom group %d is not marked in bLocalCG (ncg_home %d)\n", dd->rank, where, i + 1, dd->globalAtomGroupIndices[i] + 1, dd->ncg_home);
- nerr++;
- }
- }
- size_t ngl = 0;
- for (int i = 0; i < ncg_sys; i++)
- {
- if (bLocalCG[i])
- {
- ngl++;
- }
- }
- if (ngl != dd->globalAtomGroupIndices.size())
- {
- fprintf(stderr, "DD rank %d, %s: In bLocalCG %zu atom groups are marked as local, whereas there are %zu\n", dd->rank, where, ngl, dd->globalAtomGroupIndices.size());
- nerr++;
- }
-
- return nerr;
-}
-
//! Checks whether global and local atom indices are consistent.
-static void check_index_consistency(gmx_domdec_t *dd,
- int natoms_sys, int ncg_sys,
- const char *where)
+static void check_index_consistency(const gmx_domdec_t* dd, int natoms_sys, const char* where)
{
- int nerr = 0;
+ int nerr = 0;
const int numAtomsInZones = dd->comm->atomRanges.end(DDAtomRanges::Type::Zones);
- if (dd->comm->DD_debug > 1)
+ if (dd->comm->ddSettings.DD_debug > 1)
{
std::vector<int> have(natoms_sys);
for (int a = 0; a < numAtomsInZones; a++)
int globalAtomIndex = dd->globalAtomIndices[a];
if (have[globalAtomIndex] > 0)
{
- fprintf(stderr, "DD rank %d: global atom %d occurs twice: index %d and %d\n", dd->rank, globalAtomIndex + 1, have[globalAtomIndex], a+1);
+ fprintf(stderr,
+ "DD rank %d: global atom %d occurs twice: index %d and %d\n",
+ dd->rank,
+ globalAtomIndex + 1,
+ have[globalAtomIndex],
+ a + 1);
}
else
{
std::vector<int> have(numAtomsInZones);
- int ngl = 0;
+ int ngl = 0;
for (int i = 0; i < natoms_sys; i++)
{
- if (const auto entry = dd->ga2la->find(i))
+ if (const auto* entry = dd->ga2la->find(i))
{
const int a = entry->la;
if (a >= numAtomsInZones)
{
- fprintf(stderr, "DD rank %d: global atom %d marked as local atom %d, which is larger than nat_tot (%d)\n", dd->rank, i+1, a+1, numAtomsInZones);
+ fprintf(stderr,
+ "DD rank %d: global atom %d marked as local atom %d, which is larger than "
+ "nat_tot (%d)\n",
+ dd->rank,
+ i + 1,
+ a + 1,
+ numAtomsInZones);
nerr++;
}
else
have[a] = 1;
if (dd->globalAtomIndices[a] != i)
{
- fprintf(stderr, "DD rank %d: global atom %d marked as local atom %d, which has global atom index %d\n", dd->rank, i+1, a+1, dd->globalAtomIndices[a]+1);
+ fprintf(stderr,
+ "DD rank %d: global atom %d marked as local atom %d, which has global "
+ "atom index %d\n",
+ dd->rank,
+ i + 1,
+ a + 1,
+ dd->globalAtomIndices[a] + 1);
nerr++;
}
}
}
if (ngl != numAtomsInZones)
{
- fprintf(stderr,
- "DD rank %d, %s: %d global atom indices, %d local atoms\n",
- dd->rank, where, ngl, numAtomsInZones);
+ fprintf(stderr, "DD rank %d, %s: %d global atom indices, %d local atoms\n", dd->rank, where, ngl, numAtomsInZones);
}
for (int a = 0; a < numAtomsInZones; a++)
{
{
fprintf(stderr,
"DD rank %d, %s: local atom %d, global %d has no global index\n",
- dd->rank, where, a + 1, dd->globalAtomIndices[a] + 1);
+ dd->rank,
+ where,
+ a + 1,
+ dd->globalAtomIndices[a] + 1);
}
}
- nerr += check_bLocalCG(dd, ncg_sys, dd->comm->bLocalCG, where);
-
if (nerr > 0)
{
- gmx_fatal(FARGS, "DD rank %d, %s: %d atom(group) index inconsistencies",
- dd->rank, where, nerr);
+ gmx_fatal(FARGS, "DD rank %d, %s: %d atom(group) index inconsistencies", dd->rank, where, nerr);
}
}
-//! Clear all DD global state indices, starting from \p atomGroupStart and \p atomStart
-static void clearDDStateIndices(gmx_domdec_t *dd,
- int atomGroupStart,
- int atomStart)
+//! Clear all DD global state indices
+static void clearDDStateIndices(gmx_domdec_t* dd, const bool keepLocalAtomIndices)
{
- gmx_ga2la_t &ga2la = *dd->ga2la;
+ gmx_ga2la_t& ga2la = *dd->ga2la;
- if (atomStart == 0)
+ if (!keepLocalAtomIndices)
{
/* Clear the whole list without the overhead of searching */
- ga2la.clear();
+ ga2la.clear(true);
}
else
{
}
}
- char *bLocalCG = dd->comm->bLocalCG;
- if (bLocalCG)
- {
- for (size_t atomGroup = atomGroupStart; atomGroup < dd->globalAtomGroupIndices.size(); atomGroup++)
- {
- bLocalCG[dd->globalAtomGroupIndices[atomGroup]] = FALSE;
- }
- }
-
dd_clear_local_vsite_indices(dd);
if (dd->constraints)
}
}
-bool check_grid_jump(int64_t step,
- const gmx_domdec_t *dd,
- real cutoff,
- const gmx_ddbox_t *ddbox,
- gmx_bool bFatal)
-{
- gmx_domdec_comm_t *comm = dd->comm;
- bool invalid = false;
-
- for (int d = 1; d < dd->ndim; d++)
- {
- const DDCellsizesWithDlb &cellsizes = comm->cellsizesWithDlb[d];
- const int dim = dd->dim[d];
- const real limit = grid_jump_limit(comm, cutoff, d);
- real bfac = ddbox->box_size[dim];
- if (ddbox->tric_dir[dim])
- {
- bfac *= ddbox->skew_fac[dim];
- }
- if ((cellsizes.fracUpper - cellsizes.fracLowerMax)*bfac < limit ||
- (cellsizes.fracLower - cellsizes.fracUpperMin)*bfac > -limit)
- {
- invalid = true;
-
- if (bFatal)
- {
- char buf[22];
-
- /* This error should never be triggered under normal
- * circumstances, but you never know ...
- */
- gmx_fatal(FARGS, "step %s: The domain decomposition grid has shifted too much in the %c-direction around cell %d %d %d. This should not have happened. Running with fewer ranks might avoid this issue.",
- gmx_step_str(step, buf),
- dim2char(dim), dd->ci[XX], dd->ci[YY], dd->ci[ZZ]);
- }
- }
- }
-
- return invalid;
-}
//! Return the duration of force calculations on this rank.
-static float dd_force_load(gmx_domdec_comm_t *comm)
+static float dd_force_load(gmx_domdec_comm_t* comm)
{
float load;
- if (comm->eFlop)
+ if (comm->ddSettings.eFlop)
{
load = comm->flop;
- if (comm->eFlop > 1)
+ if (comm->ddSettings.eFlop > 1)
{
- load *= 1.0 + (comm->eFlop - 1)*(0.1*rand()/RAND_MAX - 0.05);
+ load *= 1.0 + (comm->ddSettings.eFlop - 1) * (0.1 * rand() / RAND_MAX - 0.05);
}
}
else
* is spurious CPU activity or MPI time, so we don't expect
* that changes in the GPU wait time matter a lot here.
*/
- gpu_wait *= (comm->cycl_n[ddCyclF] - 1)/static_cast<float>(comm->cycl_n[ddCyclF]);
+ gpu_wait *= (comm->cycl_n[ddCyclF] - 1) / static_cast<float>(comm->cycl_n[ddCyclF]);
}
/* Sum the wait times over the ranks that share the same GPU */
- MPI_Allreduce(&gpu_wait, &gpu_wait_sum, 1, MPI_FLOAT, MPI_SUM,
- comm->mpi_comm_gpu_shared);
+ MPI_Allreduce(&gpu_wait, &gpu_wait_sum, 1, MPI_FLOAT, MPI_SUM, comm->mpi_comm_gpu_shared);
/* Replace the wait time by the average over the ranks */
- load += -gpu_wait + gpu_wait_sum/comm->nrank_gpu_shared;
+ load += -gpu_wait + gpu_wait_sum / comm->nrank_gpu_shared;
}
#endif
}
}
//! Runs cell size checks and communicates the boundaries.
-static void comm_dd_ns_cell_sizes(gmx_domdec_t *dd,
- gmx_ddbox_t *ddbox,
- rvec cell_ns_x0, rvec cell_ns_x1,
- int64_t step)
+static void comm_dd_ns_cell_sizes(gmx_domdec_t* dd, gmx_ddbox_t* ddbox, rvec cell_ns_x0, rvec cell_ns_x1, int64_t step)
{
- gmx_domdec_comm_t *comm;
+ gmx_domdec_comm_t* comm;
int dim_ind, dim;
comm = dd->comm;
dim = dd->dim[dim_ind];
/* Without PBC we don't have restrictions on the outer cells */
- if (!(dim >= ddbox->npbcdim &&
- (dd->ci[dim] == 0 || dd->ci[dim] == dd->nc[dim] - 1)) &&
- isDlbOn(comm) &&
- (comm->cell_x1[dim] - comm->cell_x0[dim])*ddbox->skew_fac[dim] <
- comm->cellsize_min[dim])
+ if (!(dim >= ddbox->npbcdim && (dd->ci[dim] == 0 || dd->ci[dim] == dd->numCells[dim] - 1))
+ && isDlbOn(comm)
+ && (comm->cell_x1[dim] - comm->cell_x0[dim]) * ddbox->skew_fac[dim] < comm->cellsize_min[dim])
{
char buf[22];
- gmx_fatal(FARGS, "step %s: The %c-size (%f) times the triclinic skew factor (%f) is smaller than the smallest allowed cell size (%f) for domain decomposition grid cell %d %d %d",
- gmx_step_str(step, buf), dim2char(dim),
+ gmx_fatal(FARGS,
+ "step %s: The %c-size (%f) times the triclinic skew factor (%f) is smaller "
+ "than the smallest allowed cell size (%f) for domain decomposition grid cell "
+ "%d %d %d",
+ gmx_step_str(step, buf),
+ dim2char(dim),
comm->cell_x1[dim] - comm->cell_x0[dim],
ddbox->skew_fac[dim],
dd->comm->cellsize_min[dim],
- dd->ci[XX], dd->ci[YY], dd->ci[ZZ]);
+ dd->ci[XX],
+ dd->ci[YY],
+ dd->ci[ZZ]);
}
}
dd_move_cellx(dd, ddbox, cell_ns_x0, cell_ns_x1);
if (isDlbOn(dd->comm) && dd->ndim > 1)
{
- check_grid_jump(step, dd, dd->comm->systemInfo.cutoff, ddbox, TRUE);
+ gmx::check_grid_jump(step, dd, dd->comm->systemInfo.cutoff, ddbox, TRUE);
}
}
}
//! Compute and communicate to determine the load distribution across PP ranks.
-static void get_load_distribution(gmx_domdec_t *dd, gmx_wallcycle_t wcycle)
+static void get_load_distribution(gmx_domdec_t* dd, gmx_wallcycle* wcycle)
{
- gmx_domdec_comm_t *comm;
- domdec_load_t *load;
+ gmx_domdec_comm_t* comm;
+ domdec_load_t* load;
float cell_frac = 0, sbuf[DD_NLOAD_MAX];
gmx_bool bSepPME;
fprintf(debug, "get_load_distribution start\n");
}
- wallcycle_start(wcycle, ewcDDCOMMLOAD);
+ wallcycle_start(wcycle, WallCycleCounter::DDCommLoad);
comm = dd->comm;
comm->load[0].pme = comm->cycl[ddCyclPME];
}
+ // Either we have DLB off, or we have it on and the array is large enough
+ GMX_ASSERT(!isDlbOn(dd->comm) || static_cast<int>(dd->comm->cellsizesWithDlb.size()) == dd->ndim,
+ "DLB cell sizes data not set up properly ");
for (int d = dd->ndim - 1; d >= 0; d--)
{
- const DDCellsizesWithDlb *cellsizes = (isDlbOn(dd->comm) ? &comm->cellsizesWithDlb[d] : nullptr);
- const int dim = dd->dim[d];
+ const int dim = dd->dim[d];
/* Check if we participate in the communication in this dimension */
- if (d == dd->ndim-1 ||
- (dd->ci[dd->dim[d+1]] == 0 && dd->ci[dd->dim[dd->ndim-1]] == 0))
+ if (d == dd->ndim - 1 || (dd->ci[dd->dim[d + 1]] == 0 && dd->ci[dd->dim[dd->ndim - 1]] == 0))
{
load = &comm->load[d];
if (isDlbOn(dd->comm))
{
- cell_frac = cellsizes->fracUpper - cellsizes->fracLower;
+ cell_frac = comm->cellsizesWithDlb[d].fracUpper - comm->cellsizesWithDlb[d].fracLower;
}
int pos = 0;
- if (d == dd->ndim-1)
+ if (d == dd->ndim - 1)
{
sbuf[pos++] = dd_force_load(comm);
sbuf[pos++] = sbuf[0];
sbuf[pos++] = cell_frac;
if (d > 0)
{
- sbuf[pos++] = cellsizes->fracLowerMax;
- sbuf[pos++] = cellsizes->fracUpperMin;
+ sbuf[pos++] = comm->cellsizesWithDlb[d].fracLowerMax;
+ sbuf[pos++] = comm->cellsizesWithDlb[d].fracUpperMin;
}
}
if (bSepPME)
}
else
{
- sbuf[pos++] = comm->load[d+1].sum;
- sbuf[pos++] = comm->load[d+1].max;
+ sbuf[pos++] = comm->load[d + 1].sum;
+ sbuf[pos++] = comm->load[d + 1].max;
if (isDlbOn(dd->comm))
{
- sbuf[pos++] = comm->load[d+1].sum_m;
- sbuf[pos++] = comm->load[d+1].cvol_min*cell_frac;
- sbuf[pos++] = comm->load[d+1].flags;
+ sbuf[pos++] = comm->load[d + 1].sum_m;
+ sbuf[pos++] = comm->load[d + 1].cvol_min * cell_frac;
+ sbuf[pos++] = comm->load[d + 1].flags;
if (d > 0)
{
- sbuf[pos++] = cellsizes->fracLowerMax;
- sbuf[pos++] = cellsizes->fracUpperMin;
+ sbuf[pos++] = comm->cellsizesWithDlb[d].fracLowerMax;
+ sbuf[pos++] = comm->cellsizesWithDlb[d].fracUpperMin;
}
}
if (bSepPME)
{
- sbuf[pos++] = comm->load[d+1].mdf;
- sbuf[pos++] = comm->load[d+1].pme;
+ sbuf[pos++] = comm->load[d + 1].mdf;
+ sbuf[pos++] = comm->load[d + 1].pme;
}
}
load->nload = pos;
* The communicators are setup such that the root always has rank 0.
*/
#if GMX_MPI
- MPI_Gather(sbuf, load->nload*sizeof(float), MPI_BYTE,
- load->load, load->nload*sizeof(float), MPI_BYTE,
- 0, comm->mpi_comm_load[d]);
+ MPI_Gather(sbuf,
+ load->nload * sizeof(float),
+ MPI_BYTE,
+ load->load,
+ load->nload * sizeof(float),
+ MPI_BYTE,
+ 0,
+ comm->mpi_comm_load[d]);
#endif
if (dd->ci[dim] == dd->master_ci[dim])
{
/* We are the master along this row, process this row */
- RowMaster *rowMaster = nullptr;
+ RowMaster* rowMaster = nullptr;
if (isDlbOn(comm))
{
- rowMaster = cellsizes->rowMaster.get();
+ rowMaster = comm->cellsizesWithDlb[d].rowMaster.get();
}
load->sum = 0;
load->max = 0;
load->mdf = 0;
load->pme = 0;
int pos = 0;
- for (int i = 0; i < dd->nc[dim]; i++)
+ for (int i = 0; i < dd->numCells[dim]; i++)
{
load->sum += load->load[pos++];
- load->max = std::max(load->max, load->load[pos]);
+ load->max = std::max(load->max, load->load[pos]);
pos++;
if (isDlbOn(dd->comm))
{
pos++;
load->cvol_min = std::min(load->cvol_min, load->load[pos]);
pos++;
- if (d < dd->ndim-1)
+ if (d < dd->ndim - 1)
{
load->flags = gmx::roundToInt(load->load[pos++]);
}
}
if (isDlbOn(comm) && rowMaster->dlbIsLimited)
{
- load->sum_m *= dd->nc[dim];
- load->flags |= (1<<d);
+ load->sum_m *= dd->numCells[dim];
+ load->flags |= (1 << d);
}
}
}
if (DDMASTER(dd))
{
- comm->nload += dd_load_count(comm);
- comm->load_step += comm->cycl[ddCyclStep];
- comm->load_sum += comm->load[0].sum;
- comm->load_max += comm->load[0].max;
+ comm->nload += dd_load_count(comm);
+ comm->load_step += comm->cycl[ddCyclStep];
+ comm->load_sum += comm->load[0].sum;
+ comm->load_max += comm->load[0].max;
if (isDlbOn(comm))
{
for (int d = 0; d < dd->ndim; d++)
{
- if (comm->load[0].flags & (1<<d))
+ if (comm->load[0].flags & (1 << d))
{
comm->load_lim[d]++;
}
}
}
- wallcycle_stop(wcycle, ewcDDCOMMLOAD);
+ wallcycle_stop(wcycle, WallCycleCounter::DDCommLoad);
if (debug)
{
/*! \brief Return the relative performance loss on the total run time
* due to the force calculation load imbalance. */
-static float dd_force_load_fraction(gmx_domdec_t *dd)
+static float dd_force_load_fraction(gmx_domdec_t* dd)
{
if (dd->comm->nload > 0 && dd->comm->load_step > 0)
{
- return dd->comm->load_sum/(dd->comm->load_step*dd->nnodes);
+ return dd->comm->load_sum / (dd->comm->load_step * dd->nnodes);
}
else
{
/*! \brief Return the relative performance loss on the total run time
* due to the force calculation load imbalance. */
-static float dd_force_imb_perf_loss(gmx_domdec_t *dd)
+static float dd_force_imb_perf_loss(gmx_domdec_t* dd)
{
if (dd->comm->nload > 0 && dd->comm->load_step > 0)
{
- return
- (dd->comm->load_max*dd->nnodes - dd->comm->load_sum)/
- (dd->comm->load_step*dd->nnodes);
+ return (dd->comm->load_max * dd->nnodes - dd->comm->load_sum) / (dd->comm->load_step * dd->nnodes);
}
else
{
}
//! Print load-balance report e.g. at the end of a run.
-static void print_dd_load_av(FILE *fplog, gmx_domdec_t *dd)
+static void print_dd_load_av(FILE* fplog, gmx_domdec_t* dd)
{
- gmx_domdec_comm_t *comm = dd->comm;
+ gmx_domdec_comm_t* comm = dd->comm;
/* Only the master rank prints loads and only if we measured loads */
if (!DDMASTER(dd) || comm->nload == 0)
return;
}
- char buf[STRLEN];
- int numPpRanks = dd->nnodes;
- int numPmeRanks = (dd->pme_nodeid >= 0) ? comm->npmenodes : 0;
- int numRanks = numPpRanks + numPmeRanks;
+ char buf[STRLEN];
+ int numPpRanks = dd->nnodes;
+ int numPmeRanks = (comm->ddRankSetup.usePmeOnlyRanks ? comm->ddRankSetup.numRanksDoingPme : 0);
+ int numRanks = numPpRanks + numPmeRanks;
float lossFraction = 0;
/* Print the average load imbalance and performance loss */
if (dd->nnodes > 1 && comm->load_sum > 0)
{
- float imbalance = comm->load_max*numPpRanks/comm->load_sum - 1;
+ float imbalance = comm->load_max * numPpRanks / comm->load_sum - 1;
lossFraction = dd_force_imb_perf_loss(dd);
- std::string msg = "\nDynamic load balancing report:\n";
+ std::string msg = "\nDynamic load balancing report:\n";
std::string dlbStateStr;
switch (dd->comm->dlbState)
dlbStateStr = "DLB was off during the run due to low measured imbalance.";
break;
case DlbState::offTemporarilyLocked:
- dlbStateStr = "DLB was locked at the end of the run due to unfinished PP-PME balancing.";
+ dlbStateStr =
+ "DLB was locked at the end of the run due to unfinished PP-PME "
+ "balancing.";
break;
case DlbState::onCanTurnOff:
dlbStateStr = "DLB was turned on during the run due to measured imbalance.";
case DlbState::onUser:
dlbStateStr = "DLB was permanently on during the run per user request.";
break;
- default:
- GMX_ASSERT(false, "Undocumented DLB state");
+ default: GMX_ASSERT(false, "Undocumented DLB state");
}
msg += " " + dlbStateStr + "\n";
- msg += gmx::formatString(" Average load imbalance: %.1f%%.\n", imbalance*100);
- msg += gmx::formatString(" The balanceable part of the MD step is %d%%, load imbalance is computed from this.\n",
- gmx::roundToInt(dd_force_load_fraction(dd)*100));
- msg += gmx::formatString(" Part of the total run time spent waiting due to load imbalance: %.1f%%.\n",
- lossFraction*100);
+ msg += gmx::formatString(" Average load imbalance: %.1f%%.\n", imbalance * 100);
+ msg += gmx::formatString(
+ " The balanceable part of the MD step is %d%%, load imbalance is computed from "
+ "this.\n",
+ gmx::roundToInt(dd_force_load_fraction(dd) * 100));
+ msg += gmx::formatString(
+ " Part of the total run time spent waiting due to load imbalance: %.1f%%.\n",
+ lossFraction * 100);
fprintf(fplog, "%s", msg.c_str());
fprintf(stderr, "\n%s", msg.c_str());
}
sprintf(buf, " Steps where the load balancing was limited by -rdd, -rcon and/or -dds:");
for (int d = 0; d < dd->ndim; d++)
{
- int limitPercentage = (200*comm->load_lim[d] + 1)/(2*comm->nload);
- sprintf(buf+strlen(buf), " %c %d %%",
- dim2char(dd->dim[d]), limitPercentage);
+ int limitPercentage = (200 * comm->load_lim[d] + 1) / (2 * comm->nload);
+ sprintf(buf + strlen(buf), " %c %d %%", dim2char(dd->dim[d]), limitPercentage);
if (limitPercentage >= 50)
{
dlbWasLimited = true;
float lossFractionPme = 0;
if (numPmeRanks > 0 && comm->load_mdf > 0 && comm->load_step > 0)
{
- float pmeForceRatio = comm->load_pme/comm->load_mdf;
- lossFractionPme = (comm->load_pme - comm->load_mdf)/comm->load_step;
+ float pmeForceRatio = comm->load_pme / comm->load_mdf;
+ lossFractionPme = (comm->load_pme - comm->load_mdf) / comm->load_step;
if (lossFractionPme <= 0)
{
- lossFractionPme *= numPmeRanks/static_cast<float>(numRanks);
+ lossFractionPme *= numPmeRanks / static_cast<float>(numRanks);
}
else
{
- lossFractionPme *= numPpRanks/static_cast<float>(numRanks);
+ lossFractionPme *= numPpRanks / static_cast<float>(numRanks);
}
sprintf(buf, " Average PME mesh/force load: %5.3f\n", pmeForceRatio);
fprintf(fplog, "%s", buf);
fprintf(stderr, "%s", buf);
- sprintf(buf, " Part of the total run time spent waiting due to PP/PME imbalance: %.1f %%\n", std::fabs(lossFractionPme)*100);
+ sprintf(buf,
+ " Part of the total run time spent waiting due to PP/PME imbalance: %.1f %%\n",
+ std::fabs(lossFractionPme) * 100);
fprintf(fplog, "%s", buf);
fprintf(stderr, "%s", buf);
}
fprintf(fplog, "\n");
fprintf(stderr, "\n");
- if (lossFraction >= DD_PERF_LOSS_WARN)
+ if ((lossFraction >= DD_PERF_LOSS_WARN) && (dd->comm->dlbState != DlbState::offTemporarilyLocked))
{
std::string message = gmx::formatString(
- "NOTE: %.1f %% of the available CPU time was lost due to load imbalance\n"
- " in the domain decomposition.\n", lossFraction*100);
+ "NOTE: %.1f %% of the available CPU time was lost due to load imbalance\n"
+ " in the domain decomposition.\n",
+ lossFraction * 100);
bool hadSuggestion = false;
- if (!isDlbOn(comm))
+ if (dd->comm->dlbState == DlbState::offUser)
+ {
+ message += " You might want to allow dynamic load balancing (option -dlb auto.)\n";
+ hadSuggestion = true;
+ }
+ else if (dd->comm->dlbState == DlbState::offCanTurnOn)
{
- message += " You might want to use dynamic load balancing (option -dlb.)\n";
+ message +=
+ " Dynamic load balancing was automatically disabled, but it might be "
+ "beneficial to manually tuning it on (option -dlb on.)\n";
hadSuggestion = true;
}
else if (dlbWasLimited)
{
- message += " You might want to decrease the cell size limit (options -rdd, -rcon and/or -dds).\n";
+ message +=
+ " You might want to decrease the cell size limit (options -rdd, -rcon "
+ "and/or -dds).\n";
hadSuggestion = true;
}
message += gmx::formatString(
- " You can %sconsider manually changing the decomposition (option -dd);\n"
- " e.g. by using fewer domains along the box dimension in which there is\n"
- " considerable inhomogeneity in the simulated system.",
- hadSuggestion ? "also " : "");
-
+ " You can %sconsider manually changing the decomposition (option -dd);\n"
+ " e.g. by using fewer domains along the box dimension in which there is\n"
+ " considerable inhomogeneity in the simulated system.",
+ hadSuggestion ? "also " : "");
fprintf(fplog, "%s\n", message.c_str());
fprintf(stderr, "%s\n", message.c_str());
" had %s work to do than the PP ranks.\n"
" You might want to %s the number of PME ranks\n"
" or %s the cut-off and the grid spacing.\n",
- std::fabs(lossFractionPme*100),
- (lossFractionPme < 0) ? "less" : "more",
+ std::fabs(lossFractionPme * 100),
+ (lossFractionPme < 0) ? "less" : "more",
(lossFractionPme < 0) ? "decrease" : "increase",
(lossFractionPme < 0) ? "decrease" : "increase");
fprintf(fplog, "%s\n", buf);
}
//! Return the minimum communication volume.
-static float dd_vol_min(gmx_domdec_t *dd)
+static float dd_vol_min(gmx_domdec_t* dd)
{
- return dd->comm->load[0].cvol_min*dd->nnodes;
+ return dd->comm->load[0].cvol_min * dd->nnodes;
}
//! Return the DD load flags.
-static int dd_load_flags(gmx_domdec_t *dd)
+static int dd_load_flags(gmx_domdec_t* dd)
{
return dd->comm->load[0].flags;
}
//! Return the reported load imbalance in force calculations.
-static float dd_f_imbal(gmx_domdec_t *dd)
+static float dd_f_imbal(gmx_domdec_t* dd)
{
if (dd->comm->load[0].sum > 0)
{
- return dd->comm->load[0].max*dd->nnodes/dd->comm->load[0].sum - 1.0F;
+ return dd->comm->load[0].max * dd->nnodes / dd->comm->load[0].sum - 1.0F;
}
else
{
}
//! Returns DD load balance report.
-static std::string
-dd_print_load(gmx_domdec_t *dd,
- int64_t step)
+static std::string dd_print_load(gmx_domdec_t* dd, int64_t step)
{
gmx::StringOutputStream stream;
gmx::TextWriter log(&stream);
- int flags = dd_load_flags(dd);
+ int flags = dd_load_flags(dd);
if (flags)
{
log.writeString("DD load balancing is limited by minimum cell size in dimension");
for (int d = 0; d < dd->ndim; d++)
{
- if (flags & (1<<d))
+ if (flags & (1 << d))
{
log.writeStringFormatted(" %c", dim2char(dd->dim[d]));
}
log.writeString("DD step " + gmx::toString(step));
if (isDlbOn(dd->comm))
{
- log.writeStringFormatted(" vol min/aver %5.3f%c",
- dd_vol_min(dd), flags ? '!' : ' ');
+ log.writeStringFormatted(" vol min/aver %5.3f%c", dd_vol_min(dd), flags ? '!' : ' ');
}
if (dd->nnodes > 1)
{
- log.writeStringFormatted(" load imb.: force %4.1f%%", dd_f_imbal(dd)*100);
+ log.writeStringFormatted(" load imb.: force %4.1f%%", dd_f_imbal(dd) * 100);
}
if (dd->comm->cycl_n[ddCyclPME])
{
}
//! Prints DD load balance report in mdrun verbose mode.
-static void dd_print_load_verbose(gmx_domdec_t *dd)
+static void dd_print_load_verbose(gmx_domdec_t* dd)
{
if (isDlbOn(dd->comm))
{
- fprintf(stderr, "vol %4.2f%c ",
- dd_vol_min(dd), dd_load_flags(dd) ? '!' : ' ');
+ fprintf(stderr, "vol %4.2f%c ", dd_vol_min(dd), dd_load_flags(dd) ? '!' : ' ');
}
if (dd->nnodes > 1)
{
- fprintf(stderr, "imb F %2d%% ", gmx::roundToInt(dd_f_imbal(dd)*100));
+ fprintf(stderr, "imb F %2d%% ", gmx::roundToInt(dd_f_imbal(dd) * 100));
}
if (dd->comm->cycl_n[ddCyclPME])
{
}
//! Turns on dynamic load balancing if possible and needed.
-static void turn_on_dlb(const gmx::MDLogger &mdlog,
- gmx_domdec_t *dd,
- int64_t step)
+static void turn_on_dlb(const gmx::MDLogger& mdlog, gmx_domdec_t* dd, int64_t step)
{
- gmx_domdec_comm_t *comm = dd->comm;
+ gmx_domdec_comm_t* comm = dd->comm;
- real cellsize_min = comm->cellsize_min[dd->dim[0]];
+ real cellsize_min = comm->cellsize_min[dd->dim[0]];
for (int d = 1; d < dd->ndim; d++)
{
cellsize_min = std::min(cellsize_min, comm->cellsize_min[dd->dim[d]]);
}
/* Turn off DLB if we're too close to the cell size limit. */
- if (cellsize_min < comm->cellsize_limit*1.05)
+ if (cellsize_min < comm->cellsize_limit * 1.05)
{
- GMX_LOG(mdlog.info).appendTextFormatted(
- "step %s Measured %.1f %% performance loss due to load imbalance, "
- "but the minimum cell size is smaller than 1.05 times the cell size limit. "
- "Will no longer try dynamic load balancing.",
- gmx::toString(step).c_str(), dd_force_imb_perf_loss(dd)*100);
+ GMX_LOG(mdlog.info)
+ .appendTextFormatted(
+ "step %s Measured %.1f %% performance loss due to load imbalance, "
+ "but the minimum cell size is smaller than 1.05 times the cell size limit. "
+ "Will no longer try dynamic load balancing.",
+ gmx::toString(step).c_str(),
+ dd_force_imb_perf_loss(dd) * 100);
comm->dlbState = DlbState::offForever;
return;
}
- GMX_LOG(mdlog.info).appendTextFormatted(
- "step %s Turning on dynamic load balancing, because the performance loss due to load imbalance is %.1f %%.",
- gmx::toString(step).c_str(), dd_force_imb_perf_loss(dd)*100);
+ GMX_LOG(mdlog.info)
+ .appendTextFormatted(
+ "step %s Turning on dynamic load balancing, because the performance loss due "
+ "to load imbalance is %.1f %%.",
+ gmx::toString(step).c_str(),
+ dd_force_imb_perf_loss(dd) * 100);
comm->dlbState = DlbState::onCanTurnOff;
/* Store the non-DLB performance, so we can check if DLB actually
* improves performance.
*/
- GMX_RELEASE_ASSERT(comm->cycl_n[ddCyclStep] > 0, "When we turned on DLB, we should have measured cycles");
- comm->cyclesPerStepBeforeDLB = comm->cycl[ddCyclStep]/comm->cycl_n[ddCyclStep];
+ GMX_RELEASE_ASSERT(comm->cycl_n[ddCyclStep] > 0,
+ "When we turned on DLB, we should have measured cycles");
+ comm->cyclesPerStepBeforeDLB = comm->cycl[ddCyclStep] / comm->cycl_n[ddCyclStep];
set_dlb_limits(dd);
*/
for (int d = 0; d < dd->ndim; d++)
{
- RowMaster *rowMaster = comm->cellsizesWithDlb[d].rowMaster.get();
+ RowMaster* rowMaster = comm->cellsizesWithDlb[d].rowMaster.get();
if (rowMaster)
{
comm->load[d].sum_m = comm->load[d].sum;
- int nc = dd->nc[dd->dim[d]];
+ int nc = dd->numCells[dd->dim[d]];
for (int i = 0; i < nc; i++)
{
- rowMaster->cellFrac[i] = i/static_cast<real>(nc);
+ rowMaster->cellFrac[i] = i / static_cast<real>(nc);
if (d > 0)
{
- rowMaster->bounds[i].cellFracLowerMax = i /static_cast<real>(nc);
- rowMaster->bounds[i].cellFracUpperMin = (i + 1)/static_cast<real>(nc);
+ rowMaster->bounds[i].cellFracLowerMax = i / static_cast<real>(nc);
+ rowMaster->bounds[i].cellFracUpperMin = (i + 1) / static_cast<real>(nc);
}
}
rowMaster->cellFrac[nc] = 1.0;
}
//! Turns off dynamic load balancing (but leave it able to turn back on).
-static void turn_off_dlb(const gmx::MDLogger &mdlog,
- gmx_domdec_t *dd,
- int64_t step)
+static void turn_off_dlb(const gmx::MDLogger& mdlog, gmx_domdec_t* dd, int64_t step)
{
- GMX_LOG(mdlog.info).appendText(
- "step " + gmx::toString(step) + " Turning off dynamic load balancing, because it is degrading performance.");
+ GMX_LOG(mdlog.info)
+ .appendText(
+ "step " + gmx::toString(step)
+ + " Turning off dynamic load balancing, because it is degrading performance.");
dd->comm->dlbState = DlbState::offCanTurnOn;
dd->comm->haveTurnedOffDlb = true;
dd->comm->ddPartioningCountFirstDlbOff = dd->ddp_count;
}
//! Turns off dynamic load balancing permanently.
-static void turn_off_dlb_forever(const gmx::MDLogger &mdlog,
- gmx_domdec_t *dd,
- int64_t step)
+static void turn_off_dlb_forever(const gmx::MDLogger& mdlog, gmx_domdec_t* dd, int64_t step)
{
- GMX_RELEASE_ASSERT(dd->comm->dlbState == DlbState::offCanTurnOn, "Can only turn off DLB forever when it was in the can-turn-on state");
- GMX_LOG(mdlog.info).appendText(
- "step " + gmx::toString(step) + " Will no longer try dynamic load balancing, as it degraded performance.");
+ GMX_RELEASE_ASSERT(dd->comm->dlbState == DlbState::offCanTurnOn,
+ "Can only turn off DLB forever when it was in the can-turn-on state");
+ GMX_LOG(mdlog.info)
+ .appendText(
+ "step " + gmx::toString(step)
+ + " Will no longer try dynamic load balancing, as it degraded performance.");
dd->comm->dlbState = DlbState::offForever;
}
-void set_dd_dlb_max_cutoff(t_commrec *cr, real cutoff)
+void set_dd_dlb_max_cutoff(t_commrec* cr, real cutoff)
{
- gmx_domdec_comm_t *comm;
+ gmx_domdec_comm_t* comm;
comm = cr->dd->comm;
if (debug)
{
- fprintf(debug, "PME load balancing set a limit to the DLB staggering such that a %f cut-off will continue to fit\n",
+ fprintf(debug,
+ "PME load balancing set a limit to the DLB staggering such that a %f cut-off will "
+ "continue to fit\n",
comm->PMELoadBal_max_cutoff);
}
}
//! Merge atom buffers.
-static void merge_cg_buffers(int ncell,
- gmx_domdec_comm_dim_t *cd, int pulse,
- int *ncg_cell,
- gmx::ArrayRef<int> index_gl,
- const int *recv_i,
- gmx::ArrayRef<gmx::RVec> x,
- gmx::ArrayRef<const gmx::RVec> recv_vr,
- cginfo_mb_t *cginfo_mb,
- gmx::ArrayRef<int> cginfo)
+static void merge_cg_buffers(int ncell,
+ gmx_domdec_comm_dim_t* cd,
+ int pulse,
+ int* ncg_cell,
+ gmx::ArrayRef<int> index_gl,
+ const int* recv_i,
+ gmx::ArrayRef<gmx::RVec> x,
+ gmx::ArrayRef<const gmx::RVec> recv_vr,
+ gmx::ArrayRef<gmx::AtomInfoWithinMoleculeBlock> atomInfoForEachMoleculeBlock,
+ gmx::ArrayRef<int64_t> atomInfo)
{
gmx_domdec_ind_t *ind, *ind_p;
int p, cell, c, cg, cg0, cg1, cg_gl;
/* First correct the already stored data */
shift = ind->nrecv[ncell];
- for (cell = ncell-1; cell >= 0; cell--)
+ for (cell = ncell - 1; cell >= 0; cell--)
{
shift -= ind->nrecv[cell];
if (shift > 0)
{
/* Move the cg's present from previous grid pulses */
- cg0 = ncg_cell[ncell+cell];
- cg1 = ncg_cell[ncell+cell+1];
- for (cg = cg1-1; cg >= cg0; cg--)
+ cg0 = ncg_cell[ncell + cell];
+ cg1 = ncg_cell[ncell + cell + 1];
+ for (cg = cg1 - 1; cg >= cg0; cg--)
{
index_gl[cg + shift] = index_gl[cg];
x[cg + shift] = x[cg];
- cginfo[cg + shift] = cginfo[cg];
+ atomInfo[cg + shift] = atomInfo[cg];
}
/* Correct the already stored send indices for the shift */
for (p = 1; p <= pulse; p++)
}
/* Merge in the communicated buffers */
- shift = 0;
- cg0 = 0;
+ shift = 0;
+ cg0 = 0;
for (cell = 0; cell < ncell; cell++)
{
- cg1 = ncg_cell[ncell+cell+1] + shift;
+ cg1 = ncg_cell[ncell + cell + 1] + shift;
for (cg = 0; cg < ind->nrecv[cell]; cg++)
{
/* Copy this atom from the buffer */
index_gl[cg1] = recv_i[cg0];
x[cg1] = recv_vr[cg0];
/* Copy information */
- cg_gl = index_gl[cg1];
- cginfo[cg1] = ddcginfo(cginfo_mb, cg_gl);
+ cg_gl = index_gl[cg1];
+ atomInfo[cg1] = ddGetAtomInfo(atomInfoForEachMoleculeBlock, cg_gl);
cg0++;
cg1++;
}
- shift += ind->nrecv[cell];
- ncg_cell[ncell+cell+1] = cg1;
+ shift += ind->nrecv[cell];
+ ncg_cell[ncell + cell + 1] = cg1;
}
}
//! Makes a range partitioning for the atom groups wthin a cell
-static void make_cell2at_index(gmx_domdec_comm_dim_t *cd,
- int nzone,
- int atomGroupStart)
+static void make_cell2at_index(gmx_domdec_comm_dim_t* cd, int nzone, int atomGroupStart)
{
/* Store the atom block boundaries for easy copying of communication buffers
*/
int g = atomGroupStart;
for (int zone = 0; zone < nzone; zone++)
{
- for (gmx_domdec_ind_t &ind : cd->ind)
+ for (gmx_domdec_ind_t& ind : cd->ind)
{
- ind.cell2at0[zone] = g;
- g += ind.nrecv[zone];
- ind.cell2at1[zone] = g;
+ ind.cell2at0[zone] = g;
+ g += ind.nrecv[zone];
+ ind.cell2at1[zone] = g;
}
}
}
//! Returns whether a link is missing.
-static gmx_bool missing_link(t_blocka *link, int cg_gl, const char *bLocalCG)
+static gmx_bool missing_link(const t_blocka& link, const int globalAtomIndex, const gmx_ga2la_t& ga2la)
{
- int i;
- gmx_bool bMiss;
-
- bMiss = FALSE;
- for (i = link->index[cg_gl]; i < link->index[cg_gl+1]; i++)
+ for (int i = link.index[globalAtomIndex]; i < link.index[globalAtomIndex + 1]; i++)
{
- if (!bLocalCG[link->a[i]])
+ if (!ga2la.findHome(link.a[i]))
{
- bMiss = TRUE;
+ return true;
}
}
- return bMiss;
+ return false;
}
//! Domain corners for communication, a maximum of 4 i-zones see a j domain
-typedef struct {
+typedef struct
+{
//! The corners for the non-bonded communication.
real c[DIM][4];
//! Corner for rounding.
} dd_corners_t;
//! Determine the corners of the domain(s) we are communicating with.
-static void
-set_dd_corners(const gmx_domdec_t *dd,
- int dim0, int dim1, int dim2,
- gmx_bool bDistMB,
- dd_corners_t *c)
+static void set_dd_corners(const gmx_domdec_t* dd, int dim0, int dim1, int dim2, gmx_bool bDistMB, dd_corners_t* c)
{
- const gmx_domdec_comm_t *comm;
- const gmx_domdec_zones_t *zones;
- int i, j;
+ const gmx_domdec_comm_t* comm;
+ const gmx_domdec_zones_t* zones;
comm = dd->comm;
if (dd->ndim >= 3)
{
dim2 = dd->dim[2];
- for (j = 0; j < 4; j++)
+ for (int j = 0; j < 4; j++)
{
c->c[2][j] = comm->cell_x0[dim2];
}
if (isDlbOn(dd->comm))
{
/* Use the maximum of the i-cells that see a j-cell */
- for (i = 0; i < zones->nizone; i++)
+ for (const auto& iZone : zones->iZones)
{
- for (j = zones->izone[i].j0; j < zones->izone[i].j1; j++)
+ const int iZoneIndex = iZone.iZoneIndex;
+ for (int jZone : iZone.jZoneRange)
{
- if (j >= 4)
+ if (jZone >= 4)
{
- c->c[2][j-4] =
- std::max(c->c[2][j-4],
- comm->zone_d2[zones->shift[i][dim0]][zones->shift[i][dim1]].mch0);
+ c->c[2][jZone - 4] = std::max(
+ c->c[2][jZone - 4],
+ comm->zone_d2[zones->shift[iZoneIndex][dim0]][zones->shift[iZoneIndex][dim1]]
+ .mch0);
}
}
}
{
/* For the multi-body distance we need the maximum */
c->bc[2] = comm->cell_x0[dim2];
- for (i = 0; i < 2; i++)
+ for (int i = 0; i < 2; i++)
{
- for (j = 0; j < 2; j++)
+ for (int j = 0; j < 2; j++)
{
c->bc[2] = std::max(c->bc[2], comm->zone_d2[i][j].p1_0);
}
}
}
-/*! \brief Add the atom groups we need to send in this pulse from this
- * zone to \p localAtomGroups and \p work. */
-static void
-get_zone_pulse_cgs(gmx_domdec_t *dd,
- int zonei, int zone,
- int cg0, int cg1,
- gmx::ArrayRef<const int> globalAtomGroupIndices,
- int dim, int dim_ind,
- int dim0, int dim1, int dim2,
- real r_comm2, real r_bcomm2,
- matrix box,
- bool distanceIsTriclinic,
- rvec *normal,
- real skew_fac2_d, real skew_fac_01,
- rvec *v_d, rvec *v_0, rvec *v_1,
- const dd_corners_t *c,
- const rvec sf2_round,
- gmx_bool bDistBonded,
- gmx_bool bBondComm,
- gmx_bool bDist2B,
- gmx_bool bDistMB,
- rvec *cg_cm,
- gmx::ArrayRef<const int> cginfo,
- std::vector<int> *localAtomGroups,
- dd_comm_setup_work_t *work)
+/*! \brief Add the atom groups and coordinates we need to send in this
+ * pulse from this zone to \p localAtomGroups and \p work. */
+static void get_zone_pulse_groups(gmx_domdec_t* dd,
+ int zonei,
+ int zone,
+ int cg0,
+ int cg1,
+ gmx::ArrayRef<const int> globalAtomGroupIndices,
+ int dim,
+ int dim_ind,
+ int dim0,
+ int dim1,
+ int dim2,
+ real r_comm2,
+ real r_bcomm2,
+ matrix box,
+ bool distanceIsTriclinic,
+ rvec* normal,
+ real skew_fac2_d,
+ real skew_fac_01,
+ rvec* v_d,
+ rvec* v_0,
+ rvec* v_1,
+ const dd_corners_t* c,
+ const rvec sf2_round,
+ gmx_bool bDistBonded,
+ gmx_bool bBondComm,
+ gmx_bool bDist2B,
+ gmx_bool bDistMB,
+ gmx::ArrayRef<const gmx::RVec> coordinates,
+ gmx::ArrayRef<const int64_t> atomInfo,
+ std::vector<int>* localAtomGroups,
+ dd_comm_setup_work_t* work)
{
- gmx_domdec_comm_t *comm;
+ gmx_domdec_comm_t* comm;
gmx_bool bScrew;
gmx_bool bDistMB_pulse;
int cg, i;
bDistMB_pulse = (bDistMB && bDistBonded);
/* Unpack the work data */
- std::vector<int> &ibuf = work->atomGroupBuffer;
- std::vector<gmx::RVec> &vbuf = work->positionBuffer;
+ std::vector<int>& ibuf = work->atomGroupBuffer;
+ std::vector<gmx::RVec>& vbuf = work->positionBuffer;
nsend_z = 0;
nat = work->nat;
if (!distanceIsTriclinic)
{
/* Rectangular direction, easy */
- r = cg_cm[cg][dim] - c->c[dim_ind][zone];
+ r = coordinates[cg][dim] - c->c[dim_ind][zone];
if (r > 0)
{
- r2 += r*r;
+ r2 += r * r;
}
if (bDistMB_pulse)
{
- r = cg_cm[cg][dim] - c->bc[dim_ind];
+ r = coordinates[cg][dim] - c->bc[dim_ind];
if (r > 0)
{
- rb2 += r*r;
+ rb2 += r * r;
}
}
/* Rounding gives at most a 16% reduction
*/
if (dim_ind >= 1 && (zonei == 1 || zonei == 2))
{
- r = cg_cm[cg][dim0] - c->cr0;
+ r = coordinates[cg][dim0] - c->cr0;
/* This is the first dimension, so always r >= 0 */
- r2 += r*r;
+ r2 += r * r;
if (bDistMB_pulse)
{
- rb2 += r*r;
+ rb2 += r * r;
}
}
if (dim_ind == 2 && (zonei == 2 || zonei == 3))
{
- r = cg_cm[cg][dim1] - c->cr1[zone];
+ r = coordinates[cg][dim1] - c->cr1[zone];
if (r > 0)
{
- r2 += r*r;
+ r2 += r * r;
}
if (bDistMB_pulse)
{
- r = cg_cm[cg][dim1] - c->bcr1;
+ r = coordinates[cg][dim1] - c->bcr1;
if (r > 0)
{
- rb2 += r*r;
+ rb2 += r * r;
}
}
}
*/
if (dim_ind >= 1 && (zonei == 1 || zonei == 2))
{
- rn[dim0] = cg_cm[cg][dim0] - c->cr0;
- for (i = dim0+1; i < DIM; i++)
+ rn[dim0] = coordinates[cg][dim0] - c->cr0;
+ for (i = dim0 + 1; i < DIM; i++)
{
- rn[dim0] -= cg_cm[cg][i]*v_0[i][dim0];
+ rn[dim0] -= coordinates[cg][i] * v_0[i][dim0];
}
- r2 = rn[dim0]*rn[dim0]*sf2_round[dim0];
+ r2 = rn[dim0] * rn[dim0] * sf2_round[dim0];
if (bDistMB_pulse)
{
rb[dim0] = rn[dim0];
dimd = dd->dim[i];
if (normal[dim0][dimd] > 0)
{
- rn[dimd] -= rn[dim0]*normal[dim0][dimd];
+ rn[dimd] -= rn[dim0] * normal[dim0][dimd];
if (bDistMB_pulse)
{
- rb[dimd] -= rb[dim0]*normal[dim0][dimd];
+ rb[dimd] -= rb[dim0] * normal[dim0][dimd];
}
}
}
if (dim_ind == 2 && (zonei == 2 || zonei == 3))
{
GMX_ASSERT(dim1 >= 0 && dim1 < DIM, "Must have a valid dimension index");
- rn[dim1] += cg_cm[cg][dim1] - c->cr1[zone];
- tric_sh = 0;
- for (i = dim1+1; i < DIM; i++)
+ rn[dim1] += coordinates[cg][dim1] - c->cr1[zone];
+ tric_sh = 0;
+ for (i = dim1 + 1; i < DIM; i++)
{
- tric_sh -= cg_cm[cg][i]*v_1[i][dim1];
+ tric_sh -= coordinates[cg][i] * v_1[i][dim1];
}
rn[dim1] += tric_sh;
if (rn[dim1] > 0)
{
- r2 += rn[dim1]*rn[dim1]*sf2_round[dim1];
+ r2 += rn[dim1] * rn[dim1] * sf2_round[dim1];
/* Take care of coupling of the distances
* to the planes along dim0 and dim1 through dim2.
*/
- r2 -= rn[dim0]*rn[dim1]*skew_fac_01;
+ r2 -= rn[dim0] * rn[dim1] * skew_fac_01;
/* Take care that the cell planes along dim1
* might not be orthogonal to that along dim2.
*/
if (normal[dim1][dim2] > 0)
{
- rn[dim2] -= rn[dim1]*normal[dim1][dim2];
+ rn[dim2] -= rn[dim1] * normal[dim1][dim2];
}
}
if (bDistMB_pulse)
{
- rb[dim1] +=
- cg_cm[cg][dim1] - c->bcr1 + tric_sh;
+ rb[dim1] += coordinates[cg][dim1] - c->bcr1 + tric_sh;
if (rb[dim1] > 0)
{
- rb2 += rb[dim1]*rb[dim1]*sf2_round[dim1];
+ rb2 += rb[dim1] * rb[dim1] * sf2_round[dim1];
/* Take care of coupling of the distances
* to the planes along dim0 and dim1 through dim2.
*/
- rb2 -= rb[dim0]*rb[dim1]*skew_fac_01;
+ rb2 -= rb[dim0] * rb[dim1] * skew_fac_01;
/* Take care that the cell planes along dim1
* might not be orthogonal to that along dim2.
*/
if (normal[dim1][dim2] > 0)
{
- rb[dim2] -= rb[dim1]*normal[dim1][dim2];
+ rb[dim2] -= rb[dim1] * normal[dim1][dim2];
}
}
}
}
/* The distance along the communication direction */
- rn[dim] += cg_cm[cg][dim] - c->c[dim_ind][zone];
- tric_sh = 0;
- for (i = dim+1; i < DIM; i++)
+ rn[dim] += coordinates[cg][dim] - c->c[dim_ind][zone];
+ tric_sh = 0;
+ for (i = dim + 1; i < DIM; i++)
{
- tric_sh -= cg_cm[cg][i]*v_d[i][dim];
+ tric_sh -= coordinates[cg][i] * v_d[i][dim];
}
rn[dim] += tric_sh;
if (rn[dim] > 0)
{
- r2 += rn[dim]*rn[dim]*skew_fac2_d;
+ r2 += rn[dim] * rn[dim] * skew_fac2_d;
/* Take care of coupling of the distances
* to the planes along dim0 and dim1 through dim2.
*/
if (dim_ind == 1 && zonei == 1)
{
- r2 -= rn[dim0]*rn[dim]*skew_fac_01;
+ r2 -= rn[dim0] * rn[dim] * skew_fac_01;
}
}
if (bDistMB_pulse)
{
clear_rvec(rb);
GMX_ASSERT(dim >= 0 && dim < DIM, "Must have a valid dimension index");
- rb[dim] += cg_cm[cg][dim] - c->bc[dim_ind] + tric_sh;
+ rb[dim] += coordinates[cg][dim] - c->bc[dim_ind] + tric_sh;
if (rb[dim] > 0)
{
- rb2 += rb[dim]*rb[dim]*skew_fac2_d;
+ rb2 += rb[dim] * rb[dim] * skew_fac2_d;
/* Take care of coupling of the distances
* to the planes along dim0 and dim1 through dim2.
*/
if (dim_ind == 1 && zonei == 1)
{
- rb2 -= rb[dim0]*rb[dim]*skew_fac_01;
+ rb2 -= rb[dim0] * rb[dim] * skew_fac_01;
}
}
}
}
- if (r2 < r_comm2 ||
- (bDistBonded &&
- ((bDistMB && rb2 < r_bcomm2) ||
- (bDist2B && r2 < r_bcomm2)) &&
- (!bBondComm ||
- (GET_CGINFO_BOND_INTER(cginfo[cg]) &&
- missing_link(comm->cglink, globalAtomGroupIndices[cg],
- comm->bLocalCG)))))
+ if (r2 < r_comm2
+ || (bDistBonded && ((bDistMB && rb2 < r_bcomm2) || (bDist2B && r2 < r_bcomm2))
+ && (!bBondComm
+ || ((atomInfo[cg] & gmx::sc_atomInfo_BondCommunication)
+ && missing_link(*comm->bondedLinks, globalAtomGroupIndices[cg], *dd->ga2la)))))
{
/* Store the local and global atom group indices and position */
localAtomGroups->push_back(cg);
rvec posPbc;
if (dd->ci[dim] == 0)
{
- /* Correct cg_cm for pbc */
- rvec_add(cg_cm[cg], box[dim], posPbc);
+ /* Correct coordinates for pbc */
+ rvec_add(coordinates[cg], box[dim], posPbc);
if (bScrew)
{
posPbc[YY] = box[YY][YY] - posPbc[YY];
}
else
{
- copy_rvec(cg_cm[cg], posPbc);
+ copy_rvec(coordinates[cg], posPbc);
}
vbuf.emplace_back(posPbc[XX], posPbc[YY], posPbc[ZZ]);
}
//! Clear data.
-static void clearCommSetupData(dd_comm_setup_work_t *work)
+static void clearCommSetupData(dd_comm_setup_work_t* work)
{
work->localAtomGroupBuffer.clear();
work->atomGroupBuffer.clear();
}
//! Prepare DD communication.
-static void setup_dd_communication(gmx_domdec_t *dd,
- matrix box, gmx_ddbox_t *ddbox,
- t_forcerec *fr,
- t_state *state,
- PaddedVector<gmx::RVec> *f)
+static void setup_dd_communication(gmx_domdec_t* dd, matrix box, gmx_ddbox_t* ddbox, t_forcerec* fr, t_state* state)
{
int dim_ind, dim, dim0, dim1, dim2, dimd, nat_tot;
int nzone, nzone_send, zone, zonei, cg0, cg1;
- int c, i, cg, cg_gl;
- int *zone_cg_range, pos_cg;
- gmx_domdec_comm_t *comm;
- gmx_domdec_zones_t *zones;
- gmx_domdec_comm_dim_t *cd;
- cginfo_mb_t *cginfo_mb;
+ int c;
+ int * zone_cg_range, pos_cg;
+ gmx_domdec_comm_t* comm;
+ gmx_domdec_zones_t* zones;
+ gmx_domdec_comm_dim_t* cd;
gmx_bool bBondComm, bDist2B, bDistMB, bDistBonded;
dd_corners_t corners;
- rvec *normal, *v_d, *v_0 = nullptr, *v_1 = nullptr;
+ rvec * normal, *v_d, *v_0 = nullptr, *v_1 = nullptr;
real skew_fac2_d, skew_fac_01;
rvec sf2_round;
fprintf(debug, "Setting up DD communication\n");
}
- comm = dd->comm;
+ comm = dd->comm;
if (comm->dth.empty())
{
* This can not be done in init_domain_decomposition,
* as the numbers of threads is determined later.
*/
- int numThreads = gmx_omp_nthreads_get(emntDomdec);
+ int numThreads = gmx_omp_nthreads_get(ModuleMultiThread::Domdec);
comm->dth.resize(numThreads);
}
- bBondComm = comm->bBondComm;
+ bBondComm = comm->systemInfo.filterBondedCommunication;
/* Do we need to determine extra distances for multi-body bondeds? */
bDistMB = (comm->systemInfo.haveInterDomainMultiBodyBondeds && isDlbOn(dd->comm) && dd->ndim > 1);
/* Do we need to determine extra distances for only two-body bondeds? */
bDist2B = (bBondComm && !bDistMB);
- const real r_comm2 = gmx::square(domainToDomainIntoAtomToDomainCutoff(comm->systemInfo, comm->systemInfo.cutoff));
- const real r_bcomm2 = gmx::square(domainToDomainIntoAtomToDomainCutoff(comm->systemInfo, comm->cutoff_mbody));
+ const real r_comm2 =
+ gmx::square(domainToDomainIntoAtomToDomainCutoff(comm->systemInfo, comm->systemInfo.cutoff));
+ const real r_bcomm2 =
+ gmx::square(domainToDomainIntoAtomToDomainCutoff(comm->systemInfo, comm->cutoff_mbody));
if (debug)
{
* to the cell planes along dim0 and dim1 through dim2.
* This is required for correct rounding.
*/
- skew_fac_01 =
- ddbox->v[dim0][dim1+1][dim0]*ddbox->v[dim1][dim1+1][dim1];
+ skew_fac_01 = ddbox->v[dim0][dim1 + 1][dim0] * ddbox->v[dim1][dim1 + 1][dim1];
if (debug)
{
fprintf(debug, "\nskew_fac_01 %f\n", skew_fac_01);
v_1 = ddbox->v[dim1];
}
- zone_cg_range = zones->cg_range;
- cginfo_mb = fr->cginfo_mb;
+ zone_cg_range = zones->cg_range.data();
+ gmx::ArrayRef<gmx::AtomInfoWithinMoleculeBlock> atomInfoForEachMoleculeBlock =
+ fr->atomInfoForEachMoleculeBlock;
zone_cg_range[0] = 0;
- zone_cg_range[1] = dd->ncg_home;
- comm->zone_ncg1[0] = dd->ncg_home;
- pos_cg = dd->ncg_home;
+ zone_cg_range[1] = dd->numHomeAtoms;
+ comm->zone_ncg1[0] = dd->numHomeAtoms;
+ pos_cg = dd->numHomeAtoms;
nat_tot = comm->atomRanges.numHomeAtoms();
nzone = 1;
/* Check if we need to compute triclinic distances along this dim */
bool distanceIsTriclinic = false;
- for (i = 0; i <= dim_ind; i++)
+ for (int i = 0; i <= dim_ind; i++)
{
if (ddbox->tric_dir[dd->dim[i]])
{
nzone_send = nzone;
}
- v_d = ddbox->v[dim];
- skew_fac2_d = gmx::square(ddbox->skew_fac[dim]);
+ v_d = ddbox->v[dim];
+ skew_fac2_d = gmx::square(ddbox->skew_fac[dim]);
cd->receiveInPlace = true;
for (int p = 0; p < cd->numPulses(); p++)
*/
bDistBonded = ((bDistMB || bDist2B) && p == 0);
- gmx_domdec_ind_t *ind = &cd->ind[p];
+ gmx_domdec_ind_t* ind = &cd->ind[p];
/* Thread 0 writes in the global index array */
ind->index.clear();
sf2_round[dimd] = 1;
if (ddbox->tric_dir[dimd])
{
- for (i = dd->dim[dimd]+1; i < DIM; i++)
+ for (int i = dd->dim[dimd] + 1; i < DIM; i++)
{
/* If we are shifted in dimension i
* and the cell plane is tilted forward
* in dimension i, skip this coupling.
*/
- if (!(zones->shift[nzone+zone][i] &&
- ddbox->v[dimd][i][dimd] >= 0))
+ if (!(zones->shift[nzone + zone][i] && ddbox->v[dimd][i][dimd] >= 0))
{
- sf2_round[dimd] +=
- gmx::square(ddbox->v[dimd][i][dimd]);
+ sf2_round[dimd] += gmx::square(ddbox->v[dimd][i][dimd]);
}
}
- sf2_round[dimd] = 1/sf2_round[dimd];
+ sf2_round[dimd] = 1 / sf2_round[dimd];
}
}
}
* for neighbor searching
*/
cg0 = zone_cg_range[zonei];
- cg1 = zone_cg_range[zonei+1];
+ cg1 = zone_cg_range[zonei + 1];
}
else
{
/* Look only at the cg's received in the previous grid pulse
*/
- cg1 = zone_cg_range[nzone+zone+1];
- cg0 = cg1 - cd->ind[p-1].nrecv[zone];
+ cg1 = zone_cg_range[nzone + zone + 1];
+ cg0 = cg1 - cd->ind[p - 1].nrecv[zone];
}
const int numThreads = gmx::ssize(comm->dth);
{
try
{
- dd_comm_setup_work_t &work = comm->dth[th];
+ dd_comm_setup_work_t& work = comm->dth[th];
/* Retain data accumulated into buffers of thread 0 */
if (th > 0)
clearCommSetupData(&work);
}
- int cg0_th = cg0 + ((cg1 - cg0)* th )/numThreads;
- int cg1_th = cg0 + ((cg1 - cg0)*(th+1))/numThreads;
-
- /* Get the cg's for this pulse in this zone */
- get_zone_pulse_cgs(dd, zonei, zone, cg0_th, cg1_th,
- dd->globalAtomGroupIndices,
- dim, dim_ind, dim0, dim1, dim2,
- r_comm2, r_bcomm2,
- box, distanceIsTriclinic,
- normal, skew_fac2_d, skew_fac_01,
- v_d, v_0, v_1, &corners, sf2_round,
- bDistBonded, bBondComm,
- bDist2B, bDistMB,
- state->x.rvec_array(),
- fr->cginfo,
- th == 0 ? &ind->index : &work.localAtomGroupBuffer,
- &work);
+ int cg0_th = cg0 + ((cg1 - cg0) * th) / numThreads;
+ int cg1_th = cg0 + ((cg1 - cg0) * (th + 1)) / numThreads;
+
+ /* Get the atom groups and coordinates for this pulse in this zone */
+ get_zone_pulse_groups(dd,
+ zonei,
+ zone,
+ cg0_th,
+ cg1_th,
+ dd->globalAtomGroupIndices,
+ dim,
+ dim_ind,
+ dim0,
+ dim1,
+ dim2,
+ r_comm2,
+ r_bcomm2,
+ box,
+ distanceIsTriclinic,
+ normal,
+ skew_fac2_d,
+ skew_fac_01,
+ v_d,
+ v_0,
+ v_1,
+ &corners,
+ sf2_round,
+ bDistBonded,
+ bBondComm,
+ bDist2B,
+ bDistMB,
+ state->x,
+ fr->atomInfo,
+ th == 0 ? &ind->index : &work.localAtomGroupBuffer,
+ &work);
}
- GMX_CATCH_ALL_AND_EXIT_WITH_FATAL_ERROR;
+ GMX_CATCH_ALL_AND_EXIT_WITH_FATAL_ERROR
} // END
- std::vector<int> &atomGroups = comm->dth[0].atomGroupBuffer;
- std::vector<gmx::RVec> &positions = comm->dth[0].positionBuffer;
- ind->nsend[zone] = comm->dth[0].nsend_zone;
+ std::vector<int>& atomGroups = comm->dth[0].atomGroupBuffer;
+ std::vector<gmx::RVec>& positions = comm->dth[0].positionBuffer;
+ ind->nsend[zone] = comm->dth[0].nsend_zone;
/* Append data of threads>=1 to the communication buffers */
for (int th = 1; th < numThreads; th++)
{
- const dd_comm_setup_work_t &dth = comm->dth[th];
+ const dd_comm_setup_work_t& dth = comm->dth[th];
- ind->index.insert(ind->index.end(), dth.localAtomGroupBuffer.begin(), dth.localAtomGroupBuffer.end());
- atomGroups.insert(atomGroups.end(), dth.atomGroupBuffer.begin(), dth.atomGroupBuffer.end());
- positions.insert(positions.end(), dth.positionBuffer.begin(), dth.positionBuffer.end());
+ ind->index.insert(ind->index.end(),
+ dth.localAtomGroupBuffer.begin(),
+ dth.localAtomGroupBuffer.end());
+ atomGroups.insert(
+ atomGroups.end(), dth.atomGroupBuffer.begin(), dth.atomGroupBuffer.end());
+ positions.insert(
+ positions.end(), dth.positionBuffer.begin(), dth.positionBuffer.end());
comm->dth[0].nat += dth.nat;
ind->nsend[zone] += dth.nsend_zone;
}
ind->nsend[nzone] = ind->index.size();
ind->nsend[nzone + 1] = comm->dth[0].nat;
/* Communicate the number of cg's and atoms to receive */
- ddSendrecv(dd, dim_ind, dddirBackward,
- ind->nsend, nzone+2,
- ind->nrecv, nzone+2);
+ ddSendrecv(dd, dim_ind, dddirBackward, ind->nsend, nzone + 2, ind->nrecv, nzone + 2);
if (p > 0)
{
/* We can receive in place if only the last zone is not empty */
- for (zone = 0; zone < nzone-1; zone++)
+ for (zone = 0; zone < nzone - 1; zone++)
{
if (ind->nrecv[zone] > 0)
{
DDBufferAccess<int> globalAtomGroupBuffer(comm->intBuffer, receiveBufferSize);
DDBufferAccess<gmx::RVec> rvecBuffer(comm->rvecBuffer, receiveBufferSize);
- dd_comm_setup_work_t &work = comm->dth[0];
+ dd_comm_setup_work_t& work = comm->dth[0];
/* Make space for the global cg indices */
int numAtomGroupsNew = pos_cg + ind->nrecv[nzone];
gmx::ArrayRef<int> integerBufferRef;
if (cd->receiveInPlace)
{
- integerBufferRef = gmx::arrayRefFromArray(dd->globalAtomGroupIndices.data() + pos_cg, ind->nrecv[nzone]);
+ integerBufferRef = gmx::arrayRefFromArray(
+ dd->globalAtomGroupIndices.data() + pos_cg, ind->nrecv[nzone]);
}
else
{
integerBufferRef = globalAtomGroupBuffer.buffer;
}
- ddSendrecv<int>(dd, dim_ind, dddirBackward,
- work.atomGroupBuffer, integerBufferRef);
+ ddSendrecv<int>(dd, dim_ind, dddirBackward, work.atomGroupBuffer, integerBufferRef);
- /* Make space for cg_cm */
- dd_check_alloc_ncg(fr, state, f, pos_cg + ind->nrecv[nzone]);
+ /* Make space for atominfo */
+ dd_resize_atominfo_and_state(fr, state, pos_cg + ind->nrecv[nzone]);
/* Communicate the coordinates */
gmx::ArrayRef<gmx::RVec> rvecBufferRef;
{
rvecBufferRef = rvecBuffer.buffer;
}
- ddSendrecv<gmx::RVec>(dd, dim_ind, dddirBackward,
- work.positionBuffer, rvecBufferRef);
+ ddSendrecv<gmx::RVec>(dd, dim_ind, dddirBackward, work.positionBuffer, rvecBufferRef);
/* Make the charge group index */
if (cd->receiveInPlace)
zone = (p == 0 ? 0 : nzone - 1);
while (zone < nzone)
{
- for (cg = 0; cg < ind->nrecv[zone]; cg++)
+ for (int i = 0; i < ind->nrecv[zone]; i++)
{
- cg_gl = dd->globalAtomGroupIndices[pos_cg];
- fr->cginfo[pos_cg] = ddcginfo(cginfo_mb, cg_gl);
- if (bBondComm)
- {
- /* Update the charge group presence,
- * so we can use it in the next pass of the loop.
- */
- comm->bLocalCG[cg_gl] = TRUE;
- }
+ int globalAtomIndex = dd->globalAtomGroupIndices[pos_cg];
+ fr->atomInfo[pos_cg] =
+ ddGetAtomInfo(atomInfoForEachMoleculeBlock, globalAtomIndex);
pos_cg++;
}
if (p == 0)
{
- comm->zone_ncg1[nzone+zone] = ind->nrecv[zone];
+ comm->zone_ncg1[nzone + zone] = ind->nrecv[zone];
}
zone++;
- zone_cg_range[nzone+zone] = pos_cg;
+ zone_cg_range[nzone + zone] = pos_cg;
}
}
else
{
/* This part of the code is never executed with bBondComm. */
- merge_cg_buffers(nzone, cd, p, zone_cg_range,
- dd->globalAtomGroupIndices, integerBufferRef.data(),
- state->x, rvecBufferRef,
- fr->cginfo_mb, fr->cginfo);
+ merge_cg_buffers(nzone,
+ cd,
+ p,
+ zone_cg_range,
+ dd->globalAtomGroupIndices,
+ integerBufferRef.data(),
+ state->x,
+ rvecBufferRef,
+ fr->atomInfoForEachMoleculeBlock,
+ fr->atomInfo);
pos_cg += ind->nrecv[nzone];
}
- nat_tot += ind->nrecv[nzone+1];
+ nat_tot += ind->nrecv[nzone + 1];
}
if (!cd->receiveInPlace)
{
if (!bBondComm)
{
- /* We don't need to update cginfo, since that was alrady done above.
+ /* We don't need to update atominfo, since that was already done above.
* So we pass NULL for the forcerec.
*/
- dd_set_cginfo(dd->globalAtomGroupIndices,
- dd->ncg_home, dd->globalAtomGroupIndices.size(),
- nullptr, comm->bLocalCG);
+ dd_set_atominfo(
+ dd->globalAtomGroupIndices, dd->numHomeAtoms, dd->globalAtomGroupIndices.size(), nullptr);
}
if (debug)
fprintf(debug, "Finished setting up DD communication, zones:");
for (c = 0; c < zones->n; c++)
{
- fprintf(debug, " %d", zones->cg_range[c+1]-zones->cg_range[c]);
+ fprintf(debug, " %d", zones->cg_range[c + 1] - zones->cg_range[c]);
}
fprintf(debug, "\n");
}
}
//! Set boundaries for the charge group range.
-static void set_cg_boundaries(gmx_domdec_zones_t *zones)
+static void set_cg_boundaries(gmx_domdec_zones_t* zones)
{
- int c;
-
- for (c = 0; c < zones->nizone; c++)
+ for (auto& iZone : zones->iZones)
{
- zones->izone[c].cg1 = zones->cg_range[c+1];
- zones->izone[c].jcg0 = zones->cg_range[zones->izone[c].j0];
- zones->izone[c].jcg1 = zones->cg_range[zones->izone[c].j1];
+ iZone.iAtomRange = gmx::Range<int>(0, zones->cg_range[iZone.iZoneIndex + 1]);
+ iZone.jAtomRange = gmx::Range<int>(zones->cg_range[iZone.jZoneRange.begin()],
+ zones->cg_range[iZone.jZoneRange.end()]);
}
}
* \param[in] zone_end The end of the zone range to set sizes for
* \param[in] numMovedChargeGroupsInHomeZone The number of charge groups in the home zone that should moved but are still present in dd->comm->zones.cg_range
*/
-static void set_zones_size(gmx_domdec_t *dd,
- matrix box, const gmx_ddbox_t *ddbox,
- int zone_start, int zone_end,
- int numMovedChargeGroupsInHomeZone)
+static void set_zones_size(gmx_domdec_t* dd,
+ matrix box,
+ const gmx_ddbox_t* ddbox,
+ int zone_start,
+ int zone_end,
+ int numMovedChargeGroupsInHomeZone)
{
- gmx_domdec_comm_t *comm;
- gmx_domdec_zones_t *zones;
+ gmx_domdec_comm_t* comm;
+ gmx_domdec_zones_t* zones;
gmx_bool bDistMB;
- int z, zi, d, dim;
+ int z, d, dim;
real rcs, rcmbs;
int i, j;
real vol;
zones = &comm->zones;
/* Do we need to determine extra distances for multi-body bondeds? */
- bDistMB = (comm->systemInfo.haveInterDomainMultiBodyBondeds &&
- isDlbOn(dd->comm) &&
- dd->ndim > 1);
+ bDistMB = (comm->systemInfo.haveInterDomainMultiBodyBondeds && isDlbOn(dd->comm) && dd->ndim > 1);
for (z = zone_start; z < zone_end; z++)
{
{
if (d == 1)
{
- zones->size[z].x0[dim] = comm->zone_d1[zones->shift[z][dd->dim[d-1]]].min0;
- zones->size[z].x1[dim] = comm->zone_d1[zones->shift[z][dd->dim[d-1]]].max1;
+ zones->size[z].x0[dim] = comm->zone_d1[zones->shift[z][dd->dim[d - 1]]].min0;
+ zones->size[z].x1[dim] = comm->zone_d1[zones->shift[z][dd->dim[d - 1]]].max1;
}
else if (d == 2)
{
- zones->size[z].x0[dim] = comm->zone_d2[zones->shift[z][dd->dim[d-2]]][zones->shift[z][dd->dim[d-1]]].min0;
- zones->size[z].x1[dim] = comm->zone_d2[zones->shift[z][dd->dim[d-2]]][zones->shift[z][dd->dim[d-1]]].max1;
+ zones->size[z].x0[dim] =
+ comm->zone_d2[zones->shift[z][dd->dim[d - 2]]][zones->shift[z][dd->dim[d - 1]]]
+ .min0;
+ zones->size[z].x1[dim] =
+ comm->zone_d2[zones->shift[z][dd->dim[d - 2]]][zones->shift[z][dd->dim[d - 1]]]
+ .max1;
}
}
}
rcmbs = comm->cutoff_mbody;
if (ddbox->tric_dir[dim])
{
- rcs /= ddbox->skew_fac[dim];
+ rcs /= ddbox->skew_fac[dim];
rcmbs /= ddbox->skew_fac[dim];
}
*/
if (z < 4)
{
- zones->size[z].x0[dim] =
- comm->zone_d1[zones->shift[z][dd->dim[d-1]]].min1;
+ zones->size[z].x0[dim] = comm->zone_d1[zones->shift[z][dd->dim[d - 1]]].min1;
}
else
{
if (d == 1)
{
- zones->size[z].x0[dim] =
- zones->size[zone_perm[2][z-4]].x0[dim];
+ zones->size[z].x0[dim] = zones->size[zone_perm[2][z - 4]].x0[dim];
}
else
{
zones->size[z].x0[dim] =
- comm->zone_d2[zones->shift[z][dd->dim[d-2]]][zones->shift[z][dd->dim[d-1]]].min1;
+ comm->zone_d2[zones->shift[z][dd->dim[d - 2]]][zones->shift[z][dd->dim[d - 1]]]
+ .min1;
}
}
/* A temporary limit, is updated below */
if (bDistMB)
{
- for (zi = 0; zi < zones->nizone; zi++)
+ for (size_t zi = 0; zi < zones->iZones.size(); zi++)
{
if (zones->shift[zi][dim] == 0)
{
* to a larger zone then strictly necessary.
*/
zones->size[z].x1[dim] = std::max(zones->size[z].x1[dim],
- zones->size[zi].x1[dim]+rcmbs);
+ zones->size[zi].x1[dim] + rcmbs);
}
}
}
/* Loop over the i-zones to set the upper limit of each
* j-zone they see.
*/
- for (zi = 0; zi < zones->nizone; zi++)
+ for (const auto& iZone : zones->iZones)
{
+ const int zi = iZone.iZoneIndex;
if (zones->shift[zi][dim] == 0)
{
/* We should only use zones up to zone_end */
- int jZoneEnd = std::min(zones->izone[zi].j1, zone_end);
- for (z = zones->izone[zi].j0; z < jZoneEnd; z++)
+ const auto& jZoneRangeFull = iZone.jZoneRange;
+ if (zone_end <= *jZoneRangeFull.begin())
{
- if (zones->shift[z][dim] > 0)
+ continue;
+ }
+ const gmx::Range<int> jZoneRange(*jZoneRangeFull.begin(),
+ std::min(*jZoneRangeFull.end(), zone_end));
+ for (int jZone : jZoneRange)
+ {
+ if (zones->shift[jZone][dim] > 0)
{
- zones->size[z].x1[dim] = std::max(zones->size[z].x1[dim],
- zones->size[zi].x1[dim]+rcs);
+ zones->size[jZone].x1[dim] =
+ std::max(zones->size[jZone].x1[dim], zones->size[zi].x1[dim] + rcs);
}
}
}
for (z = zone_start; z < zone_end; z++)
{
/* Initialization only required to keep the compiler happy */
- rvec corner_min = {0, 0, 0}, corner_max = {0, 0, 0}, corner;
+ rvec corner_min = { 0, 0, 0 }, corner_max = { 0, 0, 0 }, corner;
int nc, c;
/* To determine the bounding box for a zone we need to find
{
corner[ZZ] = zones->size[z].x1[ZZ];
}
- if (dd->ndim == 1 && dd->dim[0] < ZZ && ZZ < dd->unitCellInfo.npbcdim &&
- box[ZZ][1 - dd->dim[0]] != 0)
+ if (dd->ndim == 1 && dd->dim[0] < ZZ && ZZ < dd->unitCellInfo.npbcdim
+ && box[ZZ][1 - dd->dim[0]] != 0)
{
/* With 1D domain decomposition the cg's are not in
* the triclinic box, but triclinic x-y and rectangular y/x-z.
*/
int d = 1 - dd->dim[0];
- corner[d] -= corner[ZZ]*box[ZZ][d]/box[ZZ][ZZ];
+ corner[d] -= corner[ZZ] * box[ZZ][d] / box[ZZ][ZZ];
}
/* Apply the triclinic couplings */
for (i = YY; i < ddbox->npbcdim && i < DIM; i++)
{
for (j = XX; j < i; j++)
{
- corner[j] += corner[i]*box[i][j]/box[i][i];
+ corner[j] += corner[i] * box[i][j] / box[i][i];
}
}
if (c == 0)
{
vol *= zones->size[0].x1[dim] - zones->size[0].x0[dim];
}
- zones->dens_zone0 = (zones->cg_range[1] - zones->cg_range[0] - numMovedChargeGroupsInHomeZone)/vol;
+ zones->dens_zone0 =
+ (zones->cg_range[1] - zones->cg_range[0] - numMovedChargeGroupsInHomeZone) / vol;
}
if (debug)
{
for (z = zone_start; z < zone_end; z++)
{
- fprintf(debug, "zone %d %6.3f - %6.3f %6.3f - %6.3f %6.3f - %6.3f\n",
+ fprintf(debug,
+ "zone %d %6.3f - %6.3f %6.3f - %6.3f %6.3f - %6.3f\n",
z,
- zones->size[z].x0[XX], zones->size[z].x1[XX],
- zones->size[z].x0[YY], zones->size[z].x1[YY],
- zones->size[z].x0[ZZ], zones->size[z].x1[ZZ]);
- fprintf(debug, "zone %d bb %6.3f - %6.3f %6.3f - %6.3f %6.3f - %6.3f\n",
+ zones->size[z].x0[XX],
+ zones->size[z].x1[XX],
+ zones->size[z].x0[YY],
+ zones->size[z].x1[YY],
+ zones->size[z].x0[ZZ],
+ zones->size[z].x1[ZZ]);
+ fprintf(debug,
+ "zone %d bb %6.3f - %6.3f %6.3f - %6.3f %6.3f - %6.3f\n",
z,
- zones->size[z].bb_x0[XX], zones->size[z].bb_x1[XX],
- zones->size[z].bb_x0[YY], zones->size[z].bb_x1[YY],
- zones->size[z].bb_x0[ZZ], zones->size[z].bb_x1[ZZ]);
+ zones->size[z].bb_x0[XX],
+ zones->size[z].bb_x1[XX],
+ zones->size[z].bb_x0[YY],
+ zones->size[z].bb_x1[YY],
+ zones->size[z].bb_x0[ZZ],
+ zones->size[z].bb_x1[ZZ]);
}
}
}
*
* Note: both buffers should have at least \p sort.size() elements.
*/
-template <typename T>
-static void
-orderVector(gmx::ArrayRef<const gmx_cgsort_t> sort,
- gmx::ArrayRef<T> dataToSort,
- gmx::ArrayRef<T> sortBuffer)
+template<typename T>
+static void orderVector(gmx::ArrayRef<const gmx_cgsort_t> sort,
+ gmx::ArrayRef<T> dataToSort,
+ gmx::ArrayRef<T> sortBuffer)
{
GMX_ASSERT(dataToSort.size() >= sort.size(), "The vector needs to be sufficiently large");
- GMX_ASSERT(sortBuffer.size() >= sort.size(), "The sorting buffer needs to be sufficiently large");
+ GMX_ASSERT(sortBuffer.size() >= sort.size(),
+ "The sorting buffer needs to be sufficiently large");
/* Order the data into the temporary buffer */
size_t i = 0;
- for (const gmx_cgsort_t &entry : sort)
+ for (const gmx_cgsort_t& entry : sort)
{
sortBuffer[i++] = dataToSort[entry.ind];
}
/* Copy back to the original array */
- std::copy(sortBuffer.begin(), sortBuffer.begin() + sort.size(),
- dataToSort.begin());
+ std::copy(sortBuffer.begin(), sortBuffer.begin() + sort.size(), dataToSort.begin());
}
/*! \brief Order data in \p dataToSort according to \p sort
* Note: \p vectorToSort should have at least \p sort.size() elements,
* \p workVector is resized when it is too small.
*/
-template <typename T>
-static void
-orderVector(gmx::ArrayRef<const gmx_cgsort_t> sort,
- gmx::ArrayRef<T> vectorToSort,
- std::vector<T> *workVector)
+template<typename T>
+static void orderVector(gmx::ArrayRef<const gmx_cgsort_t> sort,
+ gmx::ArrayRef<T> vectorToSort,
+ std::vector<T>* workVector)
{
if (gmx::index(workVector->size()) < sort.ssize())
{
}
//! Returns the sorting order for atoms based on the nbnxn grid order in sort
-static void dd_sort_order_nbnxn(const t_forcerec *fr,
- std::vector<gmx_cgsort_t> *sort)
+static void dd_sort_order_nbnxn(const t_forcerec* fr, std::vector<gmx_cgsort_t>* sort)
{
gmx::ArrayRef<const int> atomOrder = fr->nbv->getLocalAtomOrder();
}
//! Returns the sorting state for DD.
-static void dd_sort_state(gmx_domdec_t *dd, t_forcerec *fr, t_state *state)
+static void dd_sort_state(gmx_domdec_t* dd, t_forcerec* fr, t_state* state)
{
- gmx_domdec_sort_t *sort = dd->comm->sort.get();
+ gmx_domdec_sort_t* sort = dd->comm->sort.get();
dd_sort_order_nbnxn(fr, &sort->sorted);
/* We alloc with the old size, since cgindex is still old */
- DDBufferAccess<gmx::RVec> rvecBuffer(dd->comm->rvecBuffer, dd->ncg_home);
+ DDBufferAccess<gmx::RVec> rvecBuffer(dd->comm->rvecBuffer, dd->numHomeAtoms);
/* Set the new home atom/charge group count */
- dd->ncg_home = sort->sorted.size();
+ dd->numHomeAtoms = sort->sorted.size();
if (debug)
{
- fprintf(debug, "Set the new home atom count to %d\n",
- dd->ncg_home);
+ fprintf(debug, "Set the new home atom count to %d\n", dd->numHomeAtoms);
}
/* Reorder the state */
gmx::ArrayRef<const gmx_cgsort_t> cgsort = sort->sorted;
- GMX_RELEASE_ASSERT(cgsort.ssize() == dd->ncg_home, "We should sort all the home atom groups");
+ GMX_RELEASE_ASSERT(cgsort.ssize() == dd->numHomeAtoms,
+ "We should sort all the home atom groups");
- if (state->flags & (1 << estX))
+ if (state->flags & enumValueToBitMask(StateEntry::X))
{
orderVector(cgsort, makeArrayRef(state->x), rvecBuffer.buffer);
}
- if (state->flags & (1 << estV))
+ if (state->flags & enumValueToBitMask(StateEntry::V))
{
orderVector(cgsort, makeArrayRef(state->v), rvecBuffer.buffer);
}
- if (state->flags & (1 << estCGP))
+ if (state->flags & enumValueToBitMask(StateEntry::Cgp))
{
orderVector(cgsort, makeArrayRef(state->cg_p), rvecBuffer.buffer);
}
/* Reorder the global cg index */
orderVector<int>(cgsort, dd->globalAtomGroupIndices, &sort->intBuffer);
- /* Reorder the cginfo */
- orderVector<int>(cgsort, fr->cginfo, &sort->intBuffer);
+ /* Reorder the atom info */
+ orderVector<int64_t>(cgsort, fr->atomInfo, &sort->int64Buffer);
/* Set the home atom number */
- dd->comm->atomRanges.setEnd(DDAtomRanges::Type::Home, dd->ncg_home);
+ dd->comm->atomRanges.setEnd(DDAtomRanges::Type::Home, dd->numHomeAtoms);
/* The atoms are now exactly in grid order, update the grid order */
fr->nbv->setLocalAtomOrder();
}
//! Accumulates load statistics.
-static void add_dd_statistics(gmx_domdec_t *dd)
+static void add_dd_statistics(gmx_domdec_t* dd)
{
- gmx_domdec_comm_t *comm = dd->comm;
+ gmx_domdec_comm_t* comm = dd->comm;
for (int i = 0; i < static_cast<int>(DDAtomRanges::Type::Number); i++)
{
auto range = static_cast<DDAtomRanges::Type>(i);
- comm->sum_nat[i] +=
- comm->atomRanges.end(range) - comm->atomRanges.start(range);
+ comm->sum_nat[i] += comm->atomRanges.end(range) - comm->atomRanges.start(range);
}
comm->ndecomp++;
}
-void reset_dd_statistics_counters(gmx_domdec_t *dd)
+void reset_dd_statistics_counters(gmx_domdec_t* dd)
{
- gmx_domdec_comm_t *comm = dd->comm;
+ gmx_domdec_comm_t* comm = dd->comm;
/* Reset all the statistics and counters for total run counting */
for (int i = 0; i < static_cast<int>(DDAtomRanges::Type::Number); i++)
comm->load_pme = 0;
}
-void print_dd_statistics(const t_commrec *cr, const t_inputrec *ir, FILE *fplog)
+namespace gmx
+{
+
+bool check_grid_jump(int64_t step, const gmx_domdec_t* dd, real cutoff, const gmx_ddbox_t* ddbox, bool bFatal)
+{
+ gmx_domdec_comm_t* comm = dd->comm;
+ bool invalid = false;
+
+ for (int d = 1; d < dd->ndim; d++)
+ {
+ const DDCellsizesWithDlb& cellsizes = comm->cellsizesWithDlb[d];
+ const int dim = dd->dim[d];
+ const real limit = grid_jump_limit(comm, cutoff, d);
+ real bfac = ddbox->box_size[dim];
+ if (ddbox->tric_dir[dim])
+ {
+ bfac *= ddbox->skew_fac[dim];
+ }
+ if ((cellsizes.fracUpper - cellsizes.fracLowerMax) * bfac < limit
+ || (cellsizes.fracLower - cellsizes.fracUpperMin) * bfac > -limit)
+ {
+ invalid = true;
+
+ if (bFatal)
+ {
+ char buf[22];
+
+ /* This error should never be triggered under normal
+ * circumstances, but you never know ...
+ */
+ gmx_fatal(FARGS,
+ "step %s: The domain decomposition grid has shifted too much in the "
+ "%c-direction around cell %d %d %d. This should not have happened. "
+ "Running with fewer ranks might avoid this issue.",
+ gmx_step_str(step, buf),
+ dim2char(dim),
+ dd->ci[XX],
+ dd->ci[YY],
+ dd->ci[ZZ]);
+ }
+ }
+ }
+
+ return invalid;
+}
+
+void print_dd_statistics(const t_commrec* cr, const t_inputrec& inputrec, FILE* fplog)
{
- gmx_domdec_comm_t *comm = cr->dd->comm;
+ gmx_domdec_comm_t* comm = cr->dd->comm;
- const int numRanges = static_cast<int>(DDAtomRanges::Type::Number);
+ const int numRanges = static_cast<int>(DDAtomRanges::Type::Number);
gmx_sumd(numRanges, comm->sum_nat, cr);
if (fplog == nullptr)
for (int i = static_cast<int>(DDAtomRanges::Type::Zones); i < numRanges; i++)
{
auto range = static_cast<DDAtomRanges::Type>(i);
- double av = comm->sum_nat[i]/comm->ndecomp;
+ double av = comm->sum_nat[i] / comm->ndecomp;
switch (range)
{
case DDAtomRanges::Type::Zones:
- fprintf(fplog,
- " av. #atoms communicated per step for force: %d x %.1f\n",
- 2, av);
+ fprintf(fplog, " av. #atoms communicated per step for force: %d x %.1f\n", 2, av);
break;
case DDAtomRanges::Type::Vsites:
if (cr->dd->vsite_comm)
{
fprintf(fplog,
" av. #atoms communicated per step for vsites: %d x %.1f\n",
- (EEL_PME(ir->coulombtype) || ir->coulombtype == eelEWALD) ? 3 : 2,
+ (EEL_PME(inputrec.coulombtype)
+ || inputrec.coulombtype == CoulombInteractionType::Ewald)
+ ? 3
+ : 2,
av);
}
break;
{
fprintf(fplog,
" av. #atoms communicated per step for LINCS: %d x %.1f\n",
- 1 + ir->nLincsIter, av);
+ 1 + inputrec.nLincsIter,
+ av);
}
break;
- default:
- gmx_incons(" Unknown type for DD statistics");
+ default: gmx_incons(" Unknown type for DD statistics");
}
}
fprintf(fplog, "\n");
- if (comm->bRecordLoad && EI_DYNAMICS(ir->eI))
+ if (comm->ddSettings.recordLoad && EI_DYNAMICS(inputrec.eI))
{
print_dd_load_av(fplog, cr->dd);
}
}
-// TODO Remove fplog when group scheme and charge groups are gone
-void dd_partition_system(FILE *fplog,
- const gmx::MDLogger &mdlog,
- int64_t step,
- const t_commrec *cr,
- gmx_bool bMasterState,
- int nstglobalcomm,
- t_state *state_global,
- const gmx_mtop_t &top_global,
- const t_inputrec *ir,
- gmx::ImdSession *imdSession,
- pull_t *pull_work,
- t_state *state_local,
- PaddedVector<gmx::RVec> *f,
- gmx::MDAtoms *mdAtoms,
- gmx_localtop_t *top_local,
- t_forcerec *fr,
- gmx_vsite_t *vsite,
- gmx::Constraints *constr,
- t_nrnb *nrnb,
- gmx_wallcycle *wcycle,
- gmx_bool bVerbose)
+//!\brief TODO Remove fplog when group scheme and charge groups are gone
+void dd_partition_system(FILE* fplog,
+ const gmx::MDLogger& mdlog,
+ int64_t step,
+ const t_commrec* cr,
+ bool bMasterState,
+ int nstglobalcomm,
+ t_state* state_global,
+ const gmx_mtop_t& top_global,
+ const t_inputrec& inputrec,
+ gmx::ImdSession* imdSession,
+ pull_t* pull_work,
+ t_state* state_local,
+ gmx::ForceBuffers* f,
+ gmx::MDAtoms* mdAtoms,
+ gmx_localtop_t* top_local,
+ t_forcerec* fr,
+ gmx::VirtualSitesHandler* vsite,
+ gmx::Constraints* constr,
+ t_nrnb* nrnb,
+ gmx_wallcycle* wcycle,
+ bool bVerbose)
{
- gmx_domdec_t *dd;
- gmx_domdec_comm_t *comm;
- gmx_ddbox_t ddbox = {0};
- int64_t step_pcoupl;
- rvec cell_ns_x0, cell_ns_x1;
- int ncgindex_set, ncg_moved, nat_f_novirsum;
- gmx_bool bBoxChanged, bNStGlobalComm, bDoDLB, bCheckWhetherToTurnDlbOn, bLogLoad;
- gmx_bool bRedist;
- ivec np;
- real grid_density;
- char sbuf[22];
-
- wallcycle_start(wcycle, ewcDOMDEC);
-
- dd = cr->dd;
- comm = dd->comm;
+ gmx_ddbox_t ddbox = { 0 };
+ int ncgindex_set;
+ char sbuf[22];
+
+ wallcycle_start(wcycle, WallCycleCounter::Domdec);
+
+ gmx_domdec_t* dd = cr->dd;
+ gmx_domdec_comm_t* comm = dd->comm;
// TODO if the update code becomes accessible here, use
// upd->deform for this logic.
- bBoxChanged = (bMasterState || inputrecDeform(ir));
- if (ir->epc != epcNO)
+ bool bBoxChanged = (bMasterState || inputrecDeform(&inputrec));
+ if (inputrec.epc != PressureCoupling::No)
{
/* With nstpcouple > 1 pressure coupling happens.
* one step after calculating the pressure.
* We need to determine the last step in which p-coupling occurred.
* MRS -- need to validate this for vv?
*/
- int n = ir->nstpcouple;
+ int n = inputrec.nstpcouple;
+ int64_t step_pcoupl;
if (n == 1)
{
step_pcoupl = step - 1;
}
else
{
- step_pcoupl = ((step - 1)/n)*n + 1;
+ step_pcoupl = ((step - 1) / n) * n + 1;
}
if (step_pcoupl >= comm->partition_step)
{
- bBoxChanged = TRUE;
+ bBoxChanged = true;
}
}
- bNStGlobalComm = (step % nstglobalcomm == 0);
-
+ bool bNStGlobalComm = (step % nstglobalcomm == 0);
+ bool bDoDLB;
if (!isDlbOn(comm))
{
- bDoDLB = FALSE;
+ bDoDLB = false;
}
else
{
* Since it requires (possibly expensive) global communication,
* we might want to do DLB less frequently.
*/
- if (bBoxChanged || ir->epc != epcNO)
+ if (bBoxChanged || inputrec.epc != PressureCoupling::No)
{
bDoDLB = bBoxChanged;
}
}
/* Check if we have recorded loads on the nodes */
- if (comm->bRecordLoad && dd_load_count(comm) > 0)
+ if (comm->ddSettings.recordLoad && dd_load_count(comm) > 0)
{
- bCheckWhetherToTurnDlbOn = dd_dlb_get_should_check_whether_to_turn_dlb_on(dd);
+ bool bCheckWhetherToTurnDlbOn = dd_dlb_get_should_check_whether_to_turn_dlb_on(dd);
/* Print load every nstlog, first and last step to the log file */
- bLogLoad = ((ir->nstlog > 0 && step % ir->nstlog == 0) ||
- comm->n_load_collect == 0 ||
- (ir->nsteps >= 0 &&
- (step + ir->nstlist > ir->init_step + ir->nsteps)));
+ bool bLogLoad = ((inputrec.nstlog > 0 && step % inputrec.nstlog == 0) || comm->n_load_collect == 0
+ || (inputrec.nsteps >= 0
+ && (step + inputrec.nstlist > inputrec.init_step + inputrec.nsteps)));
/* Avoid extra communication due to verbose screen output
* when nstglobalcomm is set.
*/
- if (bDoDLB || bLogLoad || bCheckWhetherToTurnDlbOn ||
- (bVerbose && (ir->nstlist == 0 || nstglobalcomm <= ir->nstlist)))
+ if (bDoDLB || bLogLoad || bCheckWhetherToTurnDlbOn
+ || (bVerbose && (inputrec.nstlist == 0 || nstglobalcomm <= inputrec.nstlist)))
{
get_load_distribution(dd, wcycle);
if (DDMASTER(dd))
{
if (bLogLoad)
{
- GMX_LOG(mdlog.info).asParagraph().appendText(dd_print_load(dd, step-1));
+ GMX_LOG(mdlog.info).asParagraph().appendText(dd_print_load(dd, step - 1));
}
if (bVerbose)
{
if (DDMASTER(dd))
{
/* Add the measured cycles to the running average */
- const float averageFactor = 0.1F;
+ const float averageFactor = 0.1F;
comm->cyclesPerStepDlbExpAverage =
- (1 - averageFactor)*comm->cyclesPerStepDlbExpAverage +
- averageFactor*comm->cycl[ddCyclStep]/comm->cycl_n[ddCyclStep];
+ (1 - averageFactor) * comm->cyclesPerStepDlbExpAverage
+ + averageFactor * comm->cycl[ddCyclStep] / comm->cycl_n[ddCyclStep];
}
- if (comm->dlbState == DlbState::onCanTurnOff &&
- dd->comm->n_load_have % c_checkTurnDlbOffInterval == c_checkTurnDlbOffInterval - 1)
+ if (comm->dlbState == DlbState::onCanTurnOff
+ && dd->comm->n_load_have % c_checkTurnDlbOffInterval == c_checkTurnDlbOffInterval - 1)
{
- gmx_bool turnOffDlb;
+ bool turnOffDlb;
if (DDMASTER(dd))
{
/* If the running averaged cycles with DLB are more
* We will again run and check the cycles without DLB
* and we can then decide if to turn off DLB forever.
*/
- turnOffDlb = (comm->cyclesPerStepDlbExpAverage >
- comm->cyclesPerStepBeforeDLB);
+ turnOffDlb = (comm->cyclesPerStepDlbExpAverage > comm->cyclesPerStepBeforeDLB);
}
dd_bcast(dd, sizeof(turnOffDlb), &turnOffDlb);
if (turnOffDlb)
{
/* To turn off DLB, we need to redistribute the atoms */
dd_collect_state(dd, state_local, state_global);
- bMasterState = TRUE;
+ bMasterState = true;
turn_off_dlb(mdlog, dd, step);
}
}
}
else if (bCheckWhetherToTurnDlbOn)
{
- gmx_bool turnOffDlbForever = FALSE;
- gmx_bool turnOnDlb = FALSE;
+ bool turnOffDlbForever = false;
+ bool turnOnDlb = false;
/* Since the timings are node dependent, the master decides */
if (DDMASTER(dd))
* incorrectly conclude that DLB was causing the slowdown.
* So we measure one nstlist block, no running average.
*/
- if (comm->haveTurnedOffDlb &&
- comm->cycl[ddCyclStep]/comm->cycl_n[ddCyclStep] <
- comm->cyclesPerStepDlbExpAverage)
+ if (comm->haveTurnedOffDlb
+ && comm->cycl[ddCyclStep] / comm->cycl_n[ddCyclStep] < comm->cyclesPerStepDlbExpAverage)
{
/* After turning off DLB we ran nstlist steps in fewer
* cycles than with DLB. This likely means that DLB
* observations in close succession to turn off DLB
* forever.
*/
- if (comm->dlbSlowerPartitioningCount > 0 &&
- dd->ddp_count < comm->dlbSlowerPartitioningCount + 10*c_checkTurnDlbOnInterval)
+ if (comm->dlbSlowerPartitioningCount > 0
+ && dd->ddp_count < comm->dlbSlowerPartitioningCount + 10 * c_checkTurnDlbOnInterval)
{
- turnOffDlbForever = TRUE;
+ turnOffDlbForever = true;
}
- comm->haveTurnedOffDlb = false;
+ comm->haveTurnedOffDlb = false;
/* Register when we last measured DLB slowdown */
comm->dlbSlowerPartitioningCount = dd->ddp_count;
}
* cost on the PME ranks, which will then surely result
* in lower total performance.
*/
- if (cr->npmenodes > 0 &&
- dd_pme_f_ratio(dd) > 1 - DD_PERF_LOSS_DLB_ON)
+ if (comm->ddRankSetup.usePmeOnlyRanks && dd_pme_f_ratio(dd) > 1 - DD_PERF_LOSS_DLB_ON)
{
- turnOnDlb = FALSE;
+ turnOnDlb = false;
}
else
{
}
struct
{
- gmx_bool turnOffDlbForever;
- gmx_bool turnOnDlb;
- }
- bools {
- turnOffDlbForever, turnOnDlb
- };
+ bool turnOffDlbForever;
+ bool turnOnDlb;
+ } bools{ turnOffDlbForever, turnOnDlb };
dd_bcast(dd, sizeof(bools), &bools);
if (bools.turnOffDlbForever)
{
else if (bools.turnOnDlb)
{
turn_on_dlb(mdlog, dd, step);
- bDoDLB = TRUE;
+ bDoDLB = true;
}
}
}
comm->n_load_have++;
}
- bRedist = FALSE;
+ bool bRedist = false;
if (bMasterState)
{
/* Clear the old state */
- clearDDStateIndices(dd, 0, 0);
+ clearDDStateIndices(dd, false);
ncgindex_set = 0;
auto xGlobal = positionsFromStatePointer(state_global);
- set_ddbox(*dd, true,
- DDMASTER(dd) ? state_global->box : nullptr,
- true, xGlobal,
- &ddbox);
+ set_ddbox(*dd, true, DDMASTER(dd) ? state_global->box : nullptr, true, xGlobal, &ddbox);
- distributeState(mdlog, dd, top_global, state_global, ddbox, state_local, f);
+ distributeState(mdlog, dd, top_global, state_global, ddbox, state_local);
/* Ensure that we have space for the new distribution */
- dd_check_alloc_ncg(fr, state_local, f, dd->ncg_home);
+ dd_resize_atominfo_and_state(fr, state_local, dd->numHomeAtoms);
inc_nrnb(nrnb, eNR_CGCM, comm->atomRanges.numHomeAtoms());
- dd_set_cginfo(dd->globalAtomGroupIndices, 0, dd->ncg_home, fr, comm->bLocalCG);
+ dd_set_atominfo(dd->globalAtomGroupIndices, 0, dd->numHomeAtoms, fr);
}
else if (state_local->ddp_count != dd->ddp_count)
{
if (state_local->ddp_count > dd->ddp_count)
{
- gmx_fatal(FARGS, "Internal inconsistency state_local->ddp_count (%d) > dd->ddp_count (%" PRId64 ")", state_local->ddp_count, dd->ddp_count);
+ gmx_fatal(FARGS,
+ "Internal inconsistency state_local->ddp_count (%d) > dd->ddp_count (%" PRId64
+ ")",
+ state_local->ddp_count,
+ dd->ddp_count);
}
if (state_local->ddp_count_cg_gl != state_local->ddp_count)
{
- gmx_fatal(FARGS, "Internal inconsistency state_local->ddp_count_cg_gl (%d) != state_local->ddp_count (%d)", state_local->ddp_count_cg_gl, state_local->ddp_count);
+ gmx_fatal(FARGS,
+ "Internal inconsistency state_local->ddp_count_cg_gl (%d) != "
+ "state_local->ddp_count (%d)",
+ state_local->ddp_count_cg_gl,
+ state_local->ddp_count);
}
/* Clear the old state */
- clearDDStateIndices(dd, 0, 0);
+ clearDDStateIndices(dd, false);
/* Restore the atom group indices from state_local */
restoreAtomGroups(dd, state_local);
make_dd_indices(dd, 0);
- ncgindex_set = dd->ncg_home;
+ ncgindex_set = dd->numHomeAtoms;
inc_nrnb(nrnb, eNR_CGCM, comm->atomRanges.numHomeAtoms());
- dd_set_cginfo(dd->globalAtomGroupIndices, 0, dd->ncg_home, fr, comm->bLocalCG);
+ dd_set_atominfo(dd->globalAtomGroupIndices, 0, dd->numHomeAtoms, fr);
- set_ddbox(*dd, bMasterState, state_local->box,
- true, state_local->x, &ddbox);
+ set_ddbox(*dd, bMasterState, state_local->box, true, state_local->x, &ddbox);
bRedist = isDlbOn(comm);
}
/* We have the full state, only redistribute the cgs */
/* Clear the non-home indices */
- clearDDStateIndices(dd, dd->ncg_home, comm->atomRanges.numHomeAtoms());
+ clearDDStateIndices(dd, true);
ncgindex_set = 0;
/* To avoid global communication, we do not recompute the extent
*/
if (!bNStGlobalComm)
{
- copy_rvec(comm->box0, ddbox.box0 );
+ copy_rvec(comm->box0, ddbox.box0);
copy_rvec(comm->box_size, ddbox.box_size);
}
- set_ddbox(*dd, bMasterState, state_local->box,
- bNStGlobalComm, state_local->x, &ddbox);
+ set_ddbox(*dd, bMasterState, state_local->box, bNStGlobalComm, state_local->x, &ddbox);
- bBoxChanged = TRUE;
- bRedist = TRUE;
+ bBoxChanged = true;
+ bRedist = true;
}
/* Copy needed for dim's without pbc when avoiding communication */
- copy_rvec(ddbox.box0, comm->box0 );
+ copy_rvec(ddbox.box0, comm->box0);
copy_rvec(ddbox.box_size, comm->box_size);
- set_dd_cell_sizes(dd, &ddbox, dd->unitCellInfo.ddBoxIsDynamic, bMasterState, bDoDLB,
- step, wcycle);
+ set_dd_cell_sizes(dd, &ddbox, dd->unitCellInfo.ddBoxIsDynamic, bMasterState, bDoDLB, step, wcycle);
- if (comm->nstDDDumpGrid > 0 && step % comm->nstDDDumpGrid == 0)
+ if (comm->ddSettings.nstDDDumpGrid > 0 && step % comm->ddSettings.nstDDDumpGrid == 0)
{
write_dd_grid_pdb("dd_grid", step, dd, state_local->box, &ddbox);
}
if (comm->systemInfo.useUpdateGroups)
{
- comm->updateGroupsCog->addCogs(gmx::arrayRefFromArray(dd->globalAtomGroupIndices.data(), dd->ncg_home),
- state_local->x);
+ comm->updateGroupsCog->addCogs(
+ gmx::arrayRefFromArray(dd->globalAtomGroupIndices.data(), dd->numHomeAtoms),
+ state_local->x);
}
/* Check if we should sort the charge groups */
* Thus we need to keep track of how many charge groups will move for
* obtaining correct local charge group / atom counts.
*/
- ncg_moved = 0;
+ int ncg_moved = 0;
if (bRedist)
{
- wallcycle_sub_start(wcycle, ewcsDD_REDIST);
+ wallcycle_sub_start(wcycle, WallCycleSubCounter::DDRedist);
- ncgindex_set = dd->ncg_home;
- dd_redistribute_cg(fplog, step, dd, ddbox.tric_dir,
- state_local, f, fr,
- nrnb, &ncg_moved);
+ ncgindex_set = dd->numHomeAtoms;
+ dd_redistribute_cg(fplog, step, dd, ddbox.tric_dir, state_local, fr, nrnb, &ncg_moved);
GMX_RELEASE_ASSERT(bSortCG, "Sorting is required after redistribution");
if (comm->systemInfo.useUpdateGroups)
{
- comm->updateGroupsCog->addCogs(gmx::arrayRefFromArray(dd->globalAtomGroupIndices.data(), dd->ncg_home),
- state_local->x);
+ comm->updateGroupsCog->addCogs(
+ gmx::arrayRefFromArray(dd->globalAtomGroupIndices.data(), dd->numHomeAtoms),
+ state_local->x);
}
- wallcycle_sub_stop(wcycle, ewcsDD_REDIST);
+ wallcycle_sub_stop(wcycle, WallCycleSubCounter::DDRedist);
}
- // TODO: Integrate this code in the nbnxm module
- get_nsgrid_boundaries(ddbox.nboundeddim, state_local->box,
- dd, &ddbox,
- &comm->cell_x0, &comm->cell_x1,
- dd->ncg_home, as_rvec_array(state_local->x.data()),
- cell_ns_x0, cell_ns_x1, &grid_density);
+ RVec cell_ns_x0, cell_ns_x1;
+ get_nsgrid_boundaries(ddbox.nboundeddim,
+ state_local->box,
+ dd,
+ &ddbox,
+ &comm->cell_x0,
+ &comm->cell_x1,
+ dd->numHomeAtoms,
+ as_rvec_array(state_local->x.data()),
+ cell_ns_x0,
+ cell_ns_x1);
if (bBoxChanged)
{
comm_dd_ns_cell_sizes(dd, &ddbox, cell_ns_x0, cell_ns_x1, step);
}
- /* We need to store tric_dir for dd_get_ns_ranges called from ns.c */
- copy_ivec(ddbox.tric_dir, comm->tric_dir);
-
if (bSortCG)
{
- wallcycle_sub_start(wcycle, ewcsDD_GRID);
+ wallcycle_sub_start(wcycle, WallCycleSubCounter::DDGrid);
/* Sort the state on charge group position.
* This enables exact restarts from this step.
/* Fill the ns grid with the home cell,
* so we can sort with the indices.
*/
- set_zones_ncg_home(dd);
+ set_zones_numHomeAtoms(dd);
set_zones_size(dd, state_local->box, &ddbox, 0, 1, ncg_moved);
- nbnxn_put_on_grid(fr->nbv.get(), state_local->box,
+ nbnxn_put_on_grid(fr->nbv.get(),
+ state_local->box,
0,
comm->zones.size[0].bb_x0,
comm->zones.size[0].bb_x1,
comm->updateGroupsCog.get(),
- 0, dd->ncg_home,
+ { 0, dd->numHomeAtoms },
comm->zones.dens_zone0,
- fr->cginfo,
+ fr->atomInfo,
state_local->x,
- ncg_moved, bRedist ? comm->movedBuffer.data() : nullptr);
+ ncg_moved,
+ bRedist ? comm->movedBuffer.data() : nullptr);
if (debug)
{
- fprintf(debug, "Step %s, sorting the %d home charge groups\n",
- gmx_step_str(step, sbuf), dd->ncg_home);
+ fprintf(debug, "Step %s, sorting the %d home charge groups\n", gmx_step_str(step, sbuf), dd->numHomeAtoms);
}
dd_sort_state(dd, fr, state_local);
/* After sorting and compacting we set the correct size */
- dd_resize_state(state_local, f, comm->atomRanges.numHomeAtoms());
+ state_change_natoms(state_local, comm->atomRanges.numHomeAtoms());
/* Rebuild all the indices */
- dd->ga2la->clear();
+ dd->ga2la->clear(false);
ncgindex_set = 0;
- wallcycle_sub_stop(wcycle, ewcsDD_GRID);
+ wallcycle_sub_stop(wcycle, WallCycleSubCounter::DDGrid);
}
else
{
/* With the group scheme the sorting array is part of the DD state,
* but it just got out of sync, so mark as invalid by emptying it.
*/
- if (ir->cutoff_scheme == ecutsGROUP)
+ if (inputrec.cutoff_scheme == CutoffScheme::Group)
{
comm->sort->sorted.clear();
}
comm->updateGroupsCog->clear();
}
- wallcycle_sub_start(wcycle, ewcsDD_SETUPCOMM);
+ wallcycle_sub_start(wcycle, WallCycleSubCounter::DDSetupComm);
+
+    /* Set the indices for the home atoms */
+ set_zones_numHomeAtoms(dd);
+ make_dd_indices(dd, ncgindex_set);
/* Setup up the communication and communicate the coordinates */
- setup_dd_communication(dd, state_local->box, &ddbox, fr, state_local, f);
+ setup_dd_communication(dd, state_local->box, &ddbox, fr, state_local);
- /* Set the indices */
- make_dd_indices(dd, ncgindex_set);
+ /* Set the indices for the halo atoms */
+ make_dd_indices(dd, dd->numHomeAtoms);
/* Set the charge group boundaries for neighbor searching */
set_cg_boundaries(&comm->zones);
- if (fr->cutoff_scheme == ecutsVERLET)
- {
- /* When bSortCG=true, we have already set the size for zone 0 */
- set_zones_size(dd, state_local->box, &ddbox,
- bSortCG ? 1 : 0, comm->zones.n,
- 0);
- }
+ /* When bSortCG=true, we have already set the size for zone 0 */
+ set_zones_size(dd, state_local->box, &ddbox, bSortCG ? 1 : 0, comm->zones.n, 0);
- wallcycle_sub_stop(wcycle, ewcsDD_SETUPCOMM);
+ wallcycle_sub_stop(wcycle, WallCycleSubCounter::DDSetupComm);
/*
write_dd_pdb("dd_home",step,"dump",top_global,cr,
-1,state_local->x.rvec_array(),state_local->box);
*/
- wallcycle_sub_start(wcycle, ewcsDD_MAKETOP);
+ wallcycle_sub_start(wcycle, WallCycleSubCounter::DDMakeTop);
/* Extract a local topology from the global topology */
+ IVec numPulses;
for (int i = 0; i < dd->ndim; i++)
{
- np[dd->dim[i]] = comm->cd[i].numPulses();
+ numPulses[dd->dim[i]] = comm->cd[i].numPulses();
}
- dd_make_local_top(dd, &comm->zones, dd->unitCellInfo.npbcdim, state_local->box,
- comm->cellsize_min, np,
- fr,
- state_local->x.rvec_array(),
- top_global, top_local);
+ int numBondedInteractionsToReduce = dd_make_local_top(*dd,
+ comm->zones,
+ dd->unitCellInfo.npbcdim,
+ state_local->box,
+ comm->cellsize_min,
+ numPulses,
+ fr,
+ state_local->x,
+ top_global,
+ fr->atomInfo,
+ top_local);
+ dd->localTopologyChecker->scheduleCheckOfLocalTopology(numBondedInteractionsToReduce);
- wallcycle_sub_stop(wcycle, ewcsDD_MAKETOP);
+ wallcycle_sub_stop(wcycle, WallCycleSubCounter::DDMakeTop);
- wallcycle_sub_start(wcycle, ewcsDD_MAKECONSTR);
+ wallcycle_sub_start(wcycle, WallCycleSubCounter::DDMakeConstr);
/* Set up the special atom communication */
int n = comm->atomRanges.end(DDAtomRanges::Type::Zones);
- for (int i = static_cast<int>(DDAtomRanges::Type::Zones) + 1; i < static_cast<int>(DDAtomRanges::Type::Number); i++)
+ for (int i = static_cast<int>(DDAtomRanges::Type::Zones) + 1;
+ i < static_cast<int>(DDAtomRanges::Type::Number);
+ i++)
{
auto range = static_cast<DDAtomRanges::Type>(i);
switch (range)
{
case DDAtomRanges::Type::Vsites:
- if (vsite && vsite->numInterUpdategroupVsites)
+ if (vsite && vsite->numInterUpdategroupVirtualSites())
{
n = dd_make_local_vsites(dd, n, top_local->idef.il);
}
break;
case DDAtomRanges::Type::Constraints:
- if (dd->splitConstraints || dd->splitSettles)
+ if (dd->comm->systemInfo.mayHaveSplitConstraints || dd->comm->systemInfo.mayHaveSplitSettles)
{
/* Only for inter-cg constraints we need special code */
- n = dd_make_local_constraints(dd, n, &top_global, fr->cginfo.data(),
- constr, ir->nProjOrder,
+ n = dd_make_local_constraints(dd,
+ n,
+ top_global,
+ fr->atomInfo,
+ constr,
+ inputrec.nProjOrder,
top_local->idef.il);
}
break;
- default:
- gmx_incons("Unknown special atom type setup");
+ default: gmx_incons("Unknown special atom type setup");
}
comm->atomRanges.setEnd(range, n);
}
- wallcycle_sub_stop(wcycle, ewcsDD_MAKECONSTR);
+ wallcycle_sub_stop(wcycle, WallCycleSubCounter::DDMakeConstr);
- wallcycle_sub_start(wcycle, ewcsDD_TOPOTHER);
+ wallcycle_sub_start(wcycle, WallCycleSubCounter::DDTopOther);
/* Make space for the extra coordinates for virtual site
* or constraint communication.
*/
state_local->natoms = comm->atomRanges.numAtomsTotal();
- dd_resize_state(state_local, f, state_local->natoms);
+ state_change_natoms(state_local, state_local->natoms);
- if (fr->haveDirectVirialContributions)
+ int nat_f_novirsum;
+ if (vsite && vsite->numInterUpdategroupVirtualSites())
{
- if (vsite && vsite->numInterUpdategroupVsites)
+ nat_f_novirsum = comm->atomRanges.end(DDAtomRanges::Type::Vsites);
+ }
+ else
+ {
+ if (EEL_FULL(inputrec.coulombtype) && dd->haveExclusions)
{
- nat_f_novirsum = comm->atomRanges.end(DDAtomRanges::Type::Vsites);
+ nat_f_novirsum = comm->atomRanges.end(DDAtomRanges::Type::Zones);
}
else
{
- if (EEL_FULL(ir->coulombtype) && dd->n_intercg_excl > 0)
- {
- nat_f_novirsum = comm->atomRanges.end(DDAtomRanges::Type::Zones);
- }
- else
- {
- nat_f_novirsum = comm->atomRanges.numHomeAtoms();
- }
+ nat_f_novirsum = comm->atomRanges.numHomeAtoms();
}
}
- else
- {
- nat_f_novirsum = 0;
- }
/* Set the number of atoms required for the force calculation.
* Forces need to be constrained when doing energy
* allocation, zeroing and copying, but this is probably not worth
* the complications and checking.
*/
- forcerec_set_ranges(fr, dd->ncg_home, dd->globalAtomGroupIndices.size(),
+ forcerec_set_ranges(fr,
comm->atomRanges.end(DDAtomRanges::Type::Zones),
comm->atomRanges.end(DDAtomRanges::Type::Constraints),
nat_f_novirsum);
/* Update atom data for mdatoms and several algorithms */
- mdAlgorithmsSetupAtomData(cr, ir, top_global, top_local, fr,
- nullptr, mdAtoms, constr, vsite, nullptr);
+ mdAlgorithmsSetupAtomData(cr, inputrec, top_global, top_local, fr, f, mdAtoms, constr, vsite, nullptr);
- auto mdatoms = mdAtoms->mdatoms();
+ auto* mdatoms = mdAtoms->mdatoms();
if (!thisRankHasDuty(cr, DUTY_PME))
{
/* Send the charges and/or c6/sigmas to our PME only node */
- gmx_pme_send_parameters(cr,
- fr->ic,
- mdatoms->nChargePerturbed != 0, mdatoms->nTypePerturbed != 0,
- mdatoms->chargeA, mdatoms->chargeB,
- mdatoms->sqrt_c6A, mdatoms->sqrt_c6B,
- mdatoms->sigmaA, mdatoms->sigmaB,
- dd_pme_maxshift_x(dd), dd_pme_maxshift_y(dd));
- }
-
- if (ir->bPull)
- {
- /* Update the local pull groups */
- dd_make_local_pull_groups(cr, pull_work);
+ gmx_pme_send_parameters(
+ cr,
+ *fr->ic,
+ mdatoms->nChargePerturbed != 0,
+ mdatoms->nTypePerturbed != 0,
+ mdatoms->chargeA ? gmx::arrayRefFromArray(mdatoms->chargeA, mdatoms->nr)
+ : gmx::ArrayRef<real>{},
+ mdatoms->chargeB ? gmx::arrayRefFromArray(mdatoms->chargeB, mdatoms->nr)
+ : gmx::ArrayRef<real>{},
+ mdatoms->sqrt_c6A ? gmx::arrayRefFromArray(mdatoms->sqrt_c6A, mdatoms->nr)
+ : gmx::ArrayRef<real>{},
+ mdatoms->sqrt_c6B ? gmx::arrayRefFromArray(mdatoms->sqrt_c6B, mdatoms->nr)
+ : gmx::ArrayRef<real>{},
+ mdatoms->sigmaA ? gmx::arrayRefFromArray(mdatoms->sigmaA, mdatoms->nr)
+ : gmx::ArrayRef<real>{},
+ mdatoms->sigmaB ? gmx::arrayRefFromArray(mdatoms->sigmaB, mdatoms->nr)
+ : gmx::ArrayRef<real>{},
+ dd_pme_maxshift_x(*dd),
+ dd_pme_maxshift_y(*dd));
}
if (dd->atomSets != nullptr)
dd->atomSets->setIndicesInDomainDecomposition(*(dd->ga2la));
}
- /* Update the local atoms to be communicated via the IMD protocol if bIMD is TRUE. */
+ // The pull group construction can need the atom sets updated above
+ if (inputrec.bPull)
+ {
+ /* Update the local pull groups */
+ dd_make_local_pull_groups(cr, pull_work);
+ }
+
+ /* Update the local atoms to be communicated via the IMD protocol if bIMD is true. */
imdSession->dd_make_local_IMD_atoms(dd);
add_dd_statistics(dd);
* the last vsite construction, we need to communicate the constructing
* atom coordinates again (for spreading the forces this MD step).
*/
- dd_move_x_vsites(dd, state_local->box, state_local->x.rvec_array());
+ dd_move_x_vsites(*dd, state_local->box, state_local->x.rvec_array());
- wallcycle_sub_stop(wcycle, ewcsDD_TOPOTHER);
+ wallcycle_sub_stop(wcycle, WallCycleSubCounter::DDTopOther);
- if (comm->nstDDDump > 0 && step % comm->nstDDDump == 0)
+ if (comm->ddSettings.nstDDDump > 0 && step % comm->ddSettings.nstDDDump == 0)
{
- dd_move_x(dd, state_local->box, state_local->x, nullWallcycle);
- write_dd_pdb("dd_dump", step, "dump", &top_global, cr,
- -1, state_local->x.rvec_array(), state_local->box);
+ dd_move_x(dd, state_local->box, state_local->x, nullptr);
+ write_dd_pdb("dd_dump",
+ step,
+ "dump",
+ top_global,
+ cr,
+ -1,
+ state_local->x.rvec_array(),
+ state_local->box);
}
/* Store the partitioning step */
comm->master_cg_ddp_count = (bSortCG ? 0 : dd->ddp_count);
}
- if (comm->DD_debug > 0)
+ if (comm->ddSettings.DD_debug > 0)
{
/* Set the env var GMX_DD_DEBUG if you suspect corrupted indices */
- check_index_consistency(dd, top_global.natoms, ncg_mtop(&top_global),
- "after partitioning");
+ check_index_consistency(dd, top_global.natoms, "after partitioning");
}
- wallcycle_stop(wcycle, ewcDOMDEC);
+ wallcycle_stop(wcycle, WallCycleCounter::Domdec);
}
-/*! \brief Check whether bonded interactions are missing, if appropriate */
-void checkNumberOfBondedInteractions(const gmx::MDLogger &mdlog,
- t_commrec *cr,
- int totalNumberOfBondedInteractions,
- const gmx_mtop_t *top_global,
- const gmx_localtop_t *top_local,
- const rvec *x,
- const matrix box,
- bool *shouldCheckNumberOfBondedInteractions)
-{
- if (*shouldCheckNumberOfBondedInteractions)
- {
- if (totalNumberOfBondedInteractions != cr->dd->nbonded_global)
- {
- dd_print_missing_interactions(mdlog, cr, totalNumberOfBondedInteractions, top_global, top_local, x, box); // Does not return
- }
- *shouldCheckNumberOfBondedInteractions = false;
- }
-}
+} // namespace gmx