Merge branch 'release-4-6'

[alexxy/gromacs.git] / CMakeLists.txt
diff --git a/CMakeLists.txt b/CMakeLists.txt

index 8db354047af569599ce12cf9bc8a4a265c94d662..ede6b0ee511ef8d7702c23d443caa572680b6bef 100644 (file)
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -145,7 +145,7 @@ if(NOT DEFINED GMX_CPU_ACCELERATION)
  endif(NOT DEFINED GMX_CPU_ACCELERATION)
  
  set(GMX_CPU_ACCELERATION "@GMX_SUGGESTED_CPU_ACCELERATION@"
-    CACHE STRING "Accelerated CPU kernels. Pick one of: None, SSE2, SSE4.1, AVX_128_FMA, AVX_256, IBM_QPX")
+    CACHE STRING "Accelerated CPU kernels. Pick one of: None, SSE2, SSE4.1, AVX_128_FMA, AVX_256, IBM_QPX, Sparc64_HPC_ACE")
  
  set(GMX_FFT_LIBRARY "fftw3" 
      CACHE STRING "FFT library choices: fftw3,mkl,fftpack[built-in]")
@@ -500,11 +500,13 @@ endif(GMX_X11)
  include(ThreadMPI)
  set(THREAD_MPI_LIB thread_mpi)
  if(GMX_THREAD_MPI)
-    tmpi_get_source_list(THREAD_MPI_SRC CXX)
+    tmpi_enable(CXX)
      set(PKG_CFLAGS "${PKG_CFLAGS} -DGMX_THREAD_MPI")
      set(GMX_MPI 1)
+    tmpi_get_source_list(THREAD_MPI_SRC)
  else(GMX_THREAD_MPI)
-    tmpi_get_source_list(THREAD_MPI_SRC CXX NOMPI)
+    tmpi_enable(CXX NOMPI)
+    tmpi_get_source_list(THREAD_MPI_SRC)
  endif(GMX_THREAD_MPI)
  
  if(GMX_GPU)
@@ -858,9 +860,10 @@ elseif(${GMX_CPU_ACCELERATION} STREQUAL "IBM_QPX")
      else()
          message(FATAL_ERROR "Cannot compile IBM QPX intrinsics without the XL compiler. If you are compiling for BlueGene/Q, use 'cmake .. -DCMAKE_TOOLCHAIN_FILE=BlueGeneQ-static-XL-C' to set up the tool chain.")
      endif()
-
+elseif(${GMX_CPU_ACCELERATION} STREQUAL "SPARC64_HPC_ACE")
+    set(GMX_CPU_ACCELERATION_SPARC64_HPC_ACE 1)
  else(${GMX_CPU_ACCELERATION} STREQUAL "NONE")
-    MESSAGE(FATAL_ERROR "Unrecognized option for accelerated kernels: ${GMX_CPU_ACCELERATION}. Pick one of None, SSE2, SSE4.1, AVX_128_FMA, AVX_256, IBM_QPX")
+    MESSAGE(FATAL_ERROR "Unrecognized option for accelerated kernels: ${GMX_CPU_ACCELERATION}. Pick one of None, SSE2, SSE4.1, AVX_128_FMA, AVX_256, IBM_QPX, Sparc64_HPC_ACE")
  endif(${GMX_CPU_ACCELERATION} STREQUAL "NONE")
  set(ACCELERATION_QUIETLY TRUE CACHE INTERNAL "")
  
@@ -912,11 +915,11 @@ if(${GMX_FFT_LIBRARY} STREQUAL "FFTW3")
  
      set(GMX_FFT_FFTW3 1)
  
-    if (NOT ${GMX_CPU_ACCELERATION} STREQUAL "NONE" AND NOT ${FFTW}_HAVE_SIMD) 
+    if ((${GMX_CPU_ACCELERATION} MATCHES "SSE" OR ${GMX_CPU_ACCELERATION} MATCHES "AVX") AND NOT ${FFTW}_HAVE_SIMD)
        message(WARNING "The fftw library found is compiled without SIMD support, which makes it slow. Consider recompiling it or contact your admin")
      endif()
  
-    if(NOT ${GMX_CPU_ACCELERATION} STREQUAL "NONE" AND ${FFTW}_HAVE_AVX)
+    if((${GMX_CPU_ACCELERATION} MATCHES "SSE" OR ${GMX_CPU_ACCELERATION} MATCHES "AVX") AND ${FFTW}_HAVE_AVX)
          # If we're not doing CPU acceleration, we don't care about FFTW performance on x86 either
          message(WARNING "The FFTW library was compiled with --enable-avx to enable AVX SIMD instructions. That might sound like a good idea for your processor, but for FFTW versions up to 3.3.3, these are slower than the SSE/SSE2 SIMD instructions for the way GROMACS uses FFTs. Limitations in the way FFTW allows GROMACS to measure performance make it awkward for either GROMACS or FFTW to make the decision for you based on runtime performance. You should compile a different FFTW library with --enable-sse or --enable-sse2. If you have a more recent FFTW, you may like to compare the performance of GROMACS with FFTW libraries compiled with and without --enable-avx. However, the GROMACS developers do not really expect the FFTW AVX optimization to help, because the performance is limited by memory access, not computation.")
      endif()