Manually sort some includes in src/gromacs

[alexxy/gromacs.git] / src / gromacs / gmxlib / gmx_thread_affinity.c
diff --git a/src/gromacs/gmxlib/gmx_thread_affinity.c b/src/gromacs/gmxlib/gmx_thread_affinity.c

index 919af6eef8643ec6ea421345e1a9d6a69b42c27f..69e256fbca94283f969d57c9f7473f63103b940d 100644 (file)
--- a/src/gromacs/gmxlib/gmx_thread_affinity.c
+++ b/src/gromacs/gmxlib/gmx_thread_affinity.c
@@ -1,10 +1,10 @@
  /*
   * This file is part of the GROMACS molecular simulation package.
   *
- * Copyright (c) 2012, by the GROMACS development team, led by
- * David van der Spoel, Berk Hess, Erik Lindahl, and including many
- * others, as listed in the AUTHORS file in the top-level source
- * directory and at http://www.gromacs.org.
+ * Copyright (c) 2012,2013,2014, by the GROMACS development team, led by
+ * Mark Abraham, David van der Spoel, Berk Hess, and Erik Lindahl,
+ * and including many others, as listed in the AUTHORS file in the
+ * top-level source directory and at http://www.gromacs.org.
   *
   * GROMACS is free software; you can redistribute it and/or
   * modify it under the terms of the GNU Lesser General Public License
@@ -32,29 +32,39 @@
   * To help us fund GROMACS development, we humbly ask that you cite
   * the research papers on the package. Check out http://www.gromacs.org.
   */
-#ifdef HAVE_CONFIG_H
-#include <config.h>
-#endif
-#if defined(HAVE_SCHED_H) && defined(HAVE_SCHED_GETAFFINITY)
-#define _GNU_SOURCE
-#include <sched.h>
-#include <sys/syscall.h>
+#include "gmxpre.h"
+
+#include "config.h"
+
+#ifdef HAVE_SCHED_AFFINITY
+#  ifndef _GNU_SOURCE
+#    define _GNU_SOURCE 1
+#  endif
+#  include <sched.h>
+#  include <sys/syscall.h>
  #endif
+
+#include "gromacs/legacyheaders/gmx_thread_affinity.h"
+
  #include <assert.h>
+#include <errno.h>
  #include <stdio.h>
-#include "typedefs.h"
-#include "types/commrec.h"
-#include "types/hw_info.h"
-#include "gmx_cpuid.h"
-#include "gmx_omp.h"
-#include "gmx_omp_nthreads.h"
-#include "mdrun.h"
-#include "md_logging.h"
-#include "statutil.h"
-#include "gmx_thread_affinity.h"
+#include <string.h>
  
  #include "thread_mpi/threads.h"
  
+#include "gromacs/legacyheaders/copyrite.h"
+#include "gromacs/legacyheaders/gmx_cpuid.h"
+#include "gromacs/legacyheaders/gmx_omp_nthreads.h"
+#include "gromacs/legacyheaders/md_logging.h"
+#include "gromacs/legacyheaders/typedefs.h"
+#include "gromacs/legacyheaders/types/commrec.h"
+#include "gromacs/legacyheaders/types/hw_info.h"
+#include "gromacs/utility/basenetwork.h"
+#include "gromacs/utility/cstringutil.h"
+#include "gromacs/utility/fatalerror.h"
+#include "gromacs/utility/gmxomp.h"
+#include "gromacs/utility/smalloc.h"
  
  static int
  get_thread_affinity_layout(FILE *fplog,
@@ -68,6 +78,7 @@ get_thread_affinity_layout(FILE *fplog,
      const int * pkg_id;
      const int * core_id;
      const int * hwthread_id;
+    gmx_bool    bPickPinStride;
  
      if (pin_offset < 0)
      {
@@ -84,6 +95,7 @@ get_thread_affinity_layout(FILE *fplog,
  
      if (rc != 0)
      {
+        /* topology information not available or invalid, ignore it */
          nhwthreads      = hwinfo->nthreads_hw_avail;
          *locality_order = NULL;
  
@@ -91,23 +103,36 @@ get_thread_affinity_layout(FILE *fplog,
          {
              /* We don't know anything about the hardware, don't pin */
              md_print_warn(cr, fplog,
-                          "We don't know how many logical cores we have, will not pin threads");
+                          "NOTE: We don't know how many logical cores we have, will not pin threads");
  
              return -1;
          }
      }
  
+    if (nthreads > nhwthreads)
+    {
+        /* We are oversubscribing, don't pin */
+        md_print_warn(NULL, fplog,
+                      "WARNING: Oversubscribing the CPU, will not pin threads");
+
+        return -1;
+    }
+
      if (pin_offset + nthreads > nhwthreads)
      {
          /* We are oversubscribing, don't pin */
          md_print_warn(NULL, fplog,
-                      "More threads requested than available logical cores, will not pin threads");
+                      "WARNING: The requested pin offset is too large for the available logical cores,\n"
+                      "         will not pin threads");
  
          return -1;
      }
  
-    /* Check if we need to choose the pinning stride */
-    if (*pin_stride == 0)
+
+    /* do we need to choose the pinning stride? */
+    bPickPinStride = (*pin_stride == 0);
+
+    if (bPickPinStride)
      {
          if (rc == 0 && pin_offset + nthreads*nhwthreads_per_core <= nhwthreads)
          {
@@ -127,25 +152,29 @@ get_thread_affinity_layout(FILE *fplog,
               */
              *pin_stride = (nhwthreads - pin_offset)/nthreads;
          }
-
-        if (fplog != NULL)
-        {
-            fprintf(fplog, "Pinning threads with a logical core stride of %d\n",
-                    *pin_stride);
-        }
      }
      else
      {
-        if (pin_offset + nthreads*(*pin_stride) > nhwthreads)
+        /* Check the placement of the thread with the largest index to make sure
+         * that the offset & stride doesn't cause pinning beyond the last hardware thread. */
+        if (pin_offset + (nthreads-1)*(*pin_stride) >= nhwthreads)
          {
              /* We are oversubscribing, don't pin */
              md_print_warn(NULL, fplog,
-                          "The requested pinning stride is too large for the available logical cores, will not pin threads");
+                          "WARNING: The requested pinning stride is too large for the available logical cores,\n"
+                          "         will not pin threads");
  
              return -1;
          }
      }
  
+    if (fplog != NULL)
+    {
+        fprintf(fplog, "Pinning threads with a%s logical core stride of %d\n",
+                bPickPinStride ? "n auto-selected" : " user-specified",
+                *pin_stride);
+    }
+
      return 0;
  }
  
@@ -162,11 +191,9 @@ void
  gmx_set_thread_affinity(FILE                *fplog,
                          const t_commrec     *cr,
                          gmx_hw_opt_t        *hw_opt,
-                        int                  nthreads_pme,
-                        const gmx_hw_info_t *hwinfo,
-                        const t_inputrec    *inputrec)
+                        const gmx_hw_info_t *hwinfo)
  {
-    int        nth_affinity_set, thread_id_node, thread_id,
+    int        nth_affinity_set, thread0_id_node,
                 nthread_local, nthread_node, nthread_hw_max, nphyscore;
      int        offset;
      const int *locality_order;
@@ -178,19 +205,22 @@ gmx_set_thread_affinity(FILE                *fplog,
          return;
      }
  
-#ifndef __APPLE__
      /* If the tMPI thread affinity setting is not supported encourage the user
       * to report it as it's either a bug or an exotic platform which we might
       * want to support. */
      if (tMPI_Thread_setaffinity_support() != TMPI_SETAFFINITY_SUPPORT_YES)
      {
+        /* we know Mac OS doesn't support setting thread affinity, so there's
+           no point in warning the user in that case. In any other case
+           the user might be able to do something about it. */
+#ifndef __APPLE__
          md_print_warn(NULL, fplog,
                        "Can not set thread affinities on the current platform. On NUMA systems this\n"
                        "can cause performance degradation. If you think your platform should support\n"
                        "setting affinities, contact the GROMACS developers.");
+#endif  /* __APPLE__ */
          return;
      }
-#endif /* __APPLE__ */
  
      /* threads on this MPI process or TMPI thread */
      if (cr->duty & DUTY_PP)
@@ -203,8 +233,8 @@ gmx_set_thread_affinity(FILE                *fplog,
      }
  
      /* map the current process to cores */
-    thread_id_node = 0;
-    nthread_node   = nthread_local;
+    thread0_id_node = 0;
+    nthread_node    = nthread_local;
  #ifdef GMX_MPI
      if (PAR(cr) || MULTISIM(cr))
      {
@@ -213,11 +243,12 @@ gmx_set_thread_affinity(FILE                *fplog,
           */
          MPI_Comm comm_intra;
  
-        MPI_Comm_split(MPI_COMM_WORLD, gmx_hostname_num(), cr->rank_intranode,
+        MPI_Comm_split(MPI_COMM_WORLD,
+                       gmx_physicalnode_id_hash(), cr->rank_intranode,
                         &comm_intra);
-        MPI_Scan(&nthread_local, &thread_id_node, 1, MPI_INT, MPI_SUM, comm_intra);
+        MPI_Scan(&nthread_local, &thread0_id_node, 1, MPI_INT, MPI_SUM, comm_intra);
          /* MPI_Scan is inclusive, but here we need exclusive */
-        thread_id_node -= nthread_local;
+        thread0_id_node -= nthread_local;
          /* Get the total number of threads on this physical node */
          MPI_Allreduce(&nthread_local, &nthread_node, 1, MPI_INT, MPI_SUM, comm_intra);
          MPI_Comm_free(&comm_intra);
@@ -250,6 +281,7 @@ gmx_set_thread_affinity(FILE                *fplog,
                                      nthread_node,
                                      offset, &hw_opt->core_pinning_stride,
                                      &locality_order);
+
      if (rc != 0)
      {
          /* Incompatible layout, don't pin, warning was already issued */
@@ -263,15 +295,15 @@ gmx_set_thread_affinity(FILE                *fplog,
       * of threads on which we succeeded.
       */
      nth_affinity_set = 0;
-#pragma omp parallel firstprivate(thread_id_node) num_threads(nthread_local) \
-    reduction(+:nth_affinity_set)
+#pragma omp parallel num_threads(nthread_local) reduction(+:nth_affinity_set)
      {
+        int      thread_id, thread_id_node;
          int      index, core;
          gmx_bool setaffinity_ret;
  
-        thread_id       = gmx_omp_get_thread_num();
-        thread_id_node += thread_id;
-        index           = offset + thread_id_node*hw_opt->core_pinning_stride;
+        thread_id      = gmx_omp_get_thread_num();
+        thread_id_node = thread0_id_node + thread_id;
+        index          = offset + thread_id_node*hw_opt->core_pinning_stride;
          if (locality_order != NULL)
          {
              core = locality_order[index];
@@ -288,8 +320,8 @@ gmx_set_thread_affinity(FILE                *fplog,
  
          if (debug)
          {
-            fprintf(debug, "On rank %2d, thread %2d, core %2d the affinity setting returned %d\n",
-                    cr->nodeid, gmx_omp_get_thread_num(), core, setaffinity_ret);
+            fprintf(debug, "On rank %2d, thread %2d, index %2d, core %2d the affinity setting returned %d\n",
+                    cr->nodeid, gmx_omp_get_thread_num(), index, core, setaffinity_ret);
          }
      }
  
@@ -310,27 +342,33 @@ gmx_set_thread_affinity(FILE                *fplog,
  
              /* sbuf1 contains rank info, while sbuf2 OpenMP thread info */
              sbuf1[0] = sbuf2[0] = '\0';
+            /* Only add rank info if we have more than one rank. */
+            if (cr->nnodes > 1)
+            {
  #ifdef GMX_MPI
  #ifdef GMX_THREAD_MPI
-            sprintf(sbuf1, "In thread-MPI thread #%d: ", cr->nodeid);
-#else       /* GMX_LIB_MPI */
-            sprintf(sbuf1, "In MPI process #%d: ", cr->nodeid);
+                sprintf(sbuf1, "In tMPI thread #%d: ", cr->nodeid);
+#else           /* GMX_LIB_MPI */
+                sprintf(sbuf1, "In MPI process #%d: ", cr->nodeid);
  #endif
-#endif      /* GMX_MPI */
+#endif          /* GMX_MPI */
+            }
  
              if (nthread_local > 1)
              {
-                sprintf(sbuf2, "of %d/%d thread%s ",
+                sprintf(sbuf2, "for %d/%d thread%s ",
                          nthread_local - nth_affinity_set, nthread_local,
-                        (nthread_local - nth_affinity_set) > 1 ? "s" : "");
+                        nthread_local > 1 ? "s" : "");
              }
  
              md_print_warn(NULL, fplog,
-                          "NOTE: %sAffinity setting %sfailed.\n"
-                          "      This can cause performance degradation!",
+                          "WARNING: %sAffinity setting %sfailed.\n"
+                          "         This can cause performance degradation! If you think your setting are\n"
+                          "         correct, contact the GROMACS developers.",
                            sbuf1, sbuf2);
          }
      }
+    return;
  }
  
  /* Check the process affinity mask and if it is found to be non-zero,
@@ -338,16 +376,53 @@ gmx_set_thread_affinity(FILE                *fplog,
   * Note that this will only work on Linux as we use a GNU feature.
   */
  void
-gmx_check_thread_affinity_set(FILE *fplog, const t_commrec *cr,
-                              gmx_hw_opt_t *hw_opt, int ncpus,
-                              gmx_bool bAfterOpenmpInit)
+gmx_check_thread_affinity_set(FILE            *fplog,
+                              const t_commrec *cr,
+                              gmx_hw_opt_t    *hw_opt,
+                              int  gmx_unused  nthreads_hw_avail,
+                              gmx_bool         bAfterOpenmpInit)
  {
-#ifdef HAVE_SCHED_GETAFFINITY
+#ifdef HAVE_SCHED_AFFINITY
      cpu_set_t mask_current;
      int       i, ret, cpu_count, cpu_set;
      gmx_bool  bAllSet;
+#endif
  
      assert(hw_opt);
+    if (!bAfterOpenmpInit)
+    {
+        /* Check for externally set OpenMP affinity and turn off internal
+         * pinning if any is found. We need to do this check early to tell
+         * thread-MPI whether it should do pinning when spawning threads.
+         * TODO: the above no longer holds, we should move these checks later
+         */
+        if (hw_opt->thread_affinity != threadaffOFF)
+        {
+            char *message;
+            if (!gmx_omp_check_thread_affinity(&message))
+            {
+                /* TODO: with -pin auto we should only warn when using all cores */
+                md_print_warn(cr, fplog, "%s", message);
+                sfree(message);
+                hw_opt->thread_affinity = threadaffOFF;
+            }
+        }
+
+        /* With thread-MPI this is needed as pinning might get turned off,
+         * which needs to be known before starting thread-MPI.
+         * With thread-MPI hw_opt is processed here on the master rank
+         * and passed to the other ranks later, so we only do this on master.
+         */
+        if (!SIMMASTER(cr))
+        {
+            return;
+        }
+#ifndef GMX_THREAD_MPI
+        return;
+#endif
+    }
+
+#ifdef HAVE_SCHED_GETAFFINITY
      if (hw_opt->thread_affinity == threadaffOFF)
      {
          /* internal affinity setting is off, don't bother checking process affinity */
@@ -369,19 +444,19 @@ gmx_check_thread_affinity_set(FILE *fplog, const t_commrec *cr,
       * detected CPUs is >= the CPUs in the current set.
       * We need to check for CPU_COUNT as it was added only in glibc 2.6. */
  #ifdef CPU_COUNT
-    if (ncpus < CPU_COUNT(&mask_current))
+    if (nthreads_hw_avail < CPU_COUNT(&mask_current))
      {
          if (debug)
          {
-            fprintf(debug, "%d CPUs detected, but %d was returned by CPU_COUNT",
-                    ncpus, CPU_COUNT(&mask_current));
+            fprintf(debug, "%d hardware threads detected, but %d was returned by CPU_COUNT",
+                    nthreads_hw_avail, CPU_COUNT(&mask_current));
          }
          return;
      }
  #endif /* CPU_COUNT */
  
      bAllSet = TRUE;
-    for (i = 0; (i < ncpus && i < CPU_SETSIZE); i++)
+    for (i = 0; (i < nthreads_hw_avail && i < CPU_SETSIZE); i++)
      {
          bAllSet = bAllSet && (CPU_ISSET(i, &mask_current) != 0);
      }
@@ -426,5 +501,5 @@ gmx_check_thread_affinity_set(FILE *fplog, const t_commrec *cr,
              fprintf(debug, "Default affinity mask found\n");
          }
      }
-#endif /* HAVE_SCHED_GETAFFINITY */
+#endif /* HAVE_SCHED_AFFINITY */
  }