3 # This file is part of the GROMACS molecular simulation package.
5 # Copyright (c) 2020,2021, by the GROMACS development team, led by
6 # Mark Abraham, David van der Spoel, Berk Hess, and Erik Lindahl,
7 # and including many others, as listed in the AUTHORS file in the
8 # top-level source directory and at http://www.gromacs.org.
10 # GROMACS is free software; you can redistribute it and/or
11 # modify it under the terms of the GNU Lesser General Public License
12 # as published by the Free Software Foundation; either version 2.1
13 # of the License, or (at your option) any later version.
15 # GROMACS is distributed in the hope that it will be useful,
16 # but WITHOUT ANY WARRANTY; without even the implied warranty of
17 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
18 # Lesser General Public License for more details.
20 # You should have received a copy of the GNU Lesser General Public
21 # License along with GROMACS; if not, see
22 # http://www.gnu.org/licenses, or write to the Free Software Foundation,
23 # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
25 # If you want to redistribute modifications to GROMACS, please
26 # consider that scientific software is very special. Version
27 # control is crucial - bugs must be traceable. We will be happy to
28 # consider code for inclusion in the official distribution, but
29 # derived work must not be called official GROMACS. Details are found
30 # in the README & COPYING files - if they are missing, get the
31 # official version at http://www.gromacs.org.
33 # To help us fund GROMACS development, we humbly ask that you cite
34 # the research papers on the package. Check out http://www.gromacs.org.
36 """Building block based Dockerfile generation for CI testing images.
38 Generates a set of docker images used for running GROMACS CI on Gitlab.
39 The images are prepared according to a selection of build configuration targets
40 that hope to cover a broad enough scope of different possible systems,
41 allowing us to check compiler types and versions, as well as libraries used
42 for accelerators and parallel communication systems. Each combination is
43 described as an entry in the build_configs dictionary, with the script
44 analysing the logic and adding build stages as needed.
46 Based on the example script provided by the NVidia HPCCM repository.
49 `NVidia HPC Container Maker <https://github.com/NVIDIA/hpc-container-maker>`__
52 * Paul Bauer <paul.bauer.q@gmail.com>
53 * Eric Irrgang <ericirrgang@gmail.com>
54 * Joe Jordan <e.jjordan12@gmail.com>
55 * Mark Abraham <mark.j.abraham@gmail.com>
59 $ python3 scripted_gmx_docker_builds.py --help
60 $ python3 scripted_gmx_docker_builds.py --format docker > Dockerfile && docker build .
61 $ python3 scripted_gmx_docker_builds.py | docker build -
71 from distutils.version import StrictVersion
75 from hpccm.building_blocks.base import bb_base
81 'This module assumes availability of supporting modules in the same directory. Add the directory to '
82 'PYTHONPATH or invoke Python from within the module directory so module location can be resolved.')
# Package name lists handed to hpccm `packages` building blocks elsewhere in this file.
# NOTE(review): several of the list literals below look truncated (entries and
# closing brackets are not visible) - confirm their contents against upstream.
84 # Basic packages for all final images.
85 _common_packages = ['build-essential',
# Extra packages for OpenCL-capable images; get_opencl_packages() returns this
# list when neither doxygen nor oneAPI is requested.
103 _opencl_extra_packages = [
105 # The following require apt_ppas=['ppa:intel-opencl/intel-opencl']
107 'ocl-icd-libopencl1',
108 'ocl-icd-opencl-dev',
110 # The following require
111 # apt_keys=['http://repo.radeon.com/rocm/apt/debian/rocm.gpg.key'],
112 # apt_repositories=['deb [arch=amd64] http://repo.radeon.com/rocm/apt/debian/ xenial main']
119 # Extra packages needed to build Python installations from source.
# Installed into the 'pyenv' stage and every per-version Python stage by add_python_stages().
120 _python_extra_packages = ['build-essential',
139 # Extra packages needed for images for building documentation.
# Appended to the extra OS packages by build_stages() when args.doxygen is set.
140 _docs_extra_packages = ['autoconf',
156 'texlive-latex-base',
157 'texlive-latex-extra',
158 'texlive-fonts-recommended',
159 'texlive-fonts-extra']
# Parse command line arguments
# The shared options come from the sibling `utility` module's parser; only the
# output format option is specific to this script.
parser = argparse.ArgumentParser(
    description='GROMACS CI image creation script',
    parents=[utility.parser],
)

# Recipe syntax to emit; passed to hpccm.config.set_container_format() by the
# script entry point.
parser.add_argument(
    '--format',
    type=str,
    default='docker',
    choices=['docker', 'singularity'],
    help='Container specification format (default: docker)',
)
def base_image_tag(args) -> str:
    """Return the name of the base container image selected by *args*.

    With ``args.cuda`` set, an ``nvidia/cuda:<cuda>-devel-<distro><release>``
    image is chosen; otherwise the plain ``centos:centos<release>`` or
    ``ubuntu:<release>`` image is used. CentOS takes precedence when both
    distributions are set.

    Args:
        args: Parsed command line arguments providing ``cuda``, ``centos`` and
            ``ubuntu`` attributes, each either ``None`` or a version string.

    Returns:
        The image reference to use for the stage's base image.

    Raises:
        RuntimeError: If neither ``args.centos`` nor ``args.ubuntu`` is set.
    """
    # Resolve the distribution once; both the CUDA and the plain image names
    # are derived from the same choice.
    if args.centos is not None:
        distro, release = 'centos', args.centos
    elif args.ubuntu is not None:
        distro, release = 'ubuntu', args.ubuntu
    else:
        raise RuntimeError('Logic error: no Linux distribution selected.')

    # Check if we use CUDA images or plain linux images
    if args.cuda is not None:
        return 'nvidia/cuda:' + args.cuda + '-devel-' + distro + release
    if distro == 'centos':
        return 'centos:centos' + release
    return 'ubuntu:' + release
def get_llvm_packages(args) -> typing.Iterable[str]:
    """Return the extra OS packages needed for a distribution-packaged LLVM.

    Args:
        args: Parsed command line arguments providing ``llvm`` and ``tsan``.

    Returns:
        A list of package names when LLVM is requested without TSAN, otherwise
        an empty list (never ``None``, so callers can wrap it in ``list()``).
    """
    # If we use the package version of LLVM, we need to install extra packages for it.
    # A TSAN build compiles its own LLVM, so nothing extra is needed then.
    if args.llvm is None or args.tsan is not None:
        return []

    llvm_version = str(args.llvm)
    # NOTE(review): verify this list against the upstream recipe - an entry
    # between 'libomp-dev' and 'clang-format-*' may have been lost.
    return ['libomp-dev',
            'clang-format-' + llvm_version,
            'clang-tidy-' + llvm_version]
def get_opencl_packages(args) -> typing.Iterable[str]:
    """Return the extra OS packages needed for OpenCL support.

    Args:
        args: Parsed command line arguments providing ``doxygen`` and ``oneapi``.

    Returns:
        The module-level ``_opencl_extra_packages`` list (the same object, not
        a copy) when neither doxygen nor oneAPI is requested, otherwise an
        empty list. The result is always a list because build_stages()
        concatenates it with another list.
    """
    if (args.doxygen is None) and (args.oneapi is None):
        return _opencl_extra_packages
    return []
# Select the compiler building block for the image described by *args*.
#
# args.llvm, args.oneapi and args.gcc are checked in that order:
#   * llvm with tsan: compiler_build_stage.runtime(_from='tsan');
#   * llvm without tsan: hpccm.building_blocks.llvm for the requested version;
#   * oneapi: compiler_build_stage.runtime(_from='oneapi'), with an
#     hpccm.toolchain naming icx/icpx attached as its 'toolchain' attribute;
#   * gcc: hpccm.building_blocks.gnu.
# Raises RuntimeError when a required compiler_build_stage is None or when
# none of the three toolchain options is set.
# NOTE(review): the gnu(...) call below looks truncated (no closing
# parenthesis), the `else:` lines before the raise statements are not visible,
# and no `return compiler` is visible - confirm against upstream.
208 def get_compiler(args, compiler_build_stage: hpccm.Stage = None) -> bb_base:
210 if args.llvm is not None:
211 # Build our own version instead to get TSAN + OMP
212 if args.tsan is not None:
213 if compiler_build_stage is not None:
214 compiler = compiler_build_stage.runtime(_from='tsan')
216 raise RuntimeError('No TSAN compiler build stage!')
217 # Build the default compiler if we don't need special support
219 compiler = hpccm.building_blocks.llvm(extra_repository=True, version=args.llvm)
221 elif args.oneapi is not None:
222 if compiler_build_stage is not None:
223 compiler = compiler_build_stage.runtime(_from='oneapi')
224 # Prepare the toolchain (needed only for builds done within the Dockerfile, e.g.
225 # OpenMPI builds, which don't currently work for other reasons)
226 oneapi_toolchain = hpccm.toolchain(CC='/opt/intel/oneapi/compiler/latest/linux/bin/intel64/icx',
227 CXX='/opt/intel/oneapi/compiler/latest/linux/bin/intel64/icpx')
228 setattr(compiler, 'toolchain', oneapi_toolchain)
231 raise RuntimeError('No oneAPI compiler build stage!')
233 elif args.gcc is not None:
234 compiler = hpccm.building_blocks.gnu(extra_repository=True,
238 raise RuntimeError('Logic error: no compiler toolchain selected.')
def get_mpi(args, compiler):
    """Return the MPI building block requested by *args*, if any.

    Args:
        args: Parsed command line arguments providing ``mpi``, ``cuda`` and
            ``oneapi``.
        compiler: Compiler building block; must expose a ``toolchain``
            attribute for OpenMPI to be built with it.

    Returns:
        An ``hpccm.building_blocks.openmpi`` block for ``args.mpi == 'openmpi'``,
        or ``None`` when no MPI library is requested.

    Raises:
        RuntimeError: If *compiler* has no ``toolchain`` attribute, if OpenMPI
            is requested together with oneAPI, if Intel MPI is requested (not
            implemented), or if the MPI flavour is unknown.
    """
    # If needed, add MPI to the image
    if args.mpi is None:
        return None

    if args.mpi == 'openmpi':
        # Build OpenMPI with CUDA support whenever the image is CUDA based.
        use_cuda = args.cuda is not None

        if not hasattr(compiler, 'toolchain'):
            raise RuntimeError('compiler is not an HPCCM compiler building block!')
        if args.oneapi is not None:
            raise RuntimeError('oneAPI building OpenMPI is not supported')
        return hpccm.building_blocks.openmpi(toolchain=compiler.toolchain, cuda=use_cuda, infiniband=False)

    if args.mpi == 'impi':
        # TODO Intel MPI from the oneAPI repo is not working reliably,
        # reasons are unclear. When solved, add packages called:
        # 'intel-oneapi-mpi', 'intel-oneapi-mpi-devel'
        # during the compiler stage.
        # TODO also consider hpccm's intel_mpi building block as an alternative.
        raise RuntimeError('Intel MPI recipe not implemented yet.')

    raise RuntimeError('Requested unknown MPI implementation.')
def get_clfft(args):
    """Return the building block that builds clFFT from source, if requested.

    Args:
        args: Parsed command line arguments; ``args.clfft`` names the clFFT git
            branch to build, or is ``None`` when clFFT is not wanted.

    Returns:
        An ``hpccm.building_blocks.generic_cmake`` block installing clFFT under
        ``/usr/local``, or ``None`` when ``args.clfft`` is ``None``.
    """
    if args.clfft is None:
        return None
    return hpccm.building_blocks.generic_cmake(
        repository='https://github.com/clMathLibraries/clFFT.git',
        prefix='/usr/local', recursive=True, branch=args.clfft, directory='clFFT/src')
def add_tsan_compiler_build_stage(input_args, output_stages: typing.MutableMapping[str, hpccm.Stage]):
    """Isolate the expensive TSAN preparation stage.

    This is a very expensive stage, but has few and disjoint dependencies, and
    its output is easily compartmentalized (/usr/local) so we can isolate this
    build stage to maximize build cache hits and reduce rebuild time, bookkeeping,
    and final image size.

    Args:
        input_args: Parsed command line arguments; ``input_args.llvm`` selects
            the LLVM release branch and the suffix of the versioned symlinks.
        output_stages: Mutable mapping that receives the new stage under the
            key ``'compiler_build'``.

    Raises:
        RuntimeError: If *output_stages* is not a mutable mapping.
    """
    if not isinstance(output_stages, collections.abc.MutableMapping):
        raise RuntimeError('Need output_stages container.')

    llvm_version = str(input_args.llvm)

    tsan_stage = hpccm.Stage()
    tsan_stage += hpccm.primitives.baseimage(image=base_image_tag(input_args), _as='tsan')

    tsan_stage += hpccm.building_blocks.packages(ospackages=['git', 'ca-certificates', 'build-essential', 'cmake'])
    # CMake will get duplicated later, but this is an expensive image, and it isn't worth optimizing
    # out that duplication...
    tsan_stage += hpccm.building_blocks.python(python3=True, python2=False, devel=False)

    compiler_branch = 'release/' + llvm_version + '.x'

    # Create version-suffixed names for the freshly built tools, mirroring the
    # names used by the distribution packages (e.g. clang-tidy-<version>).
    versioned_symlinks = [
        f'ln -s /usr/local/bin/clang++ /usr/local/bin/clang++-{llvm_version}',
        f'ln -s /usr/local/bin/clang-format /usr/local/bin/clang-format-{llvm_version}',
        f'ln -s /usr/local/bin/clang-tidy /usr/local/bin/clang-tidy-{llvm_version}',
        f'ln -s /usr/local/share/clang/run-clang-tidy.py /usr/local/bin/run-clang-tidy-{llvm_version}.py',
        f'ln -s /usr/local/bin/run-clang-tidy-{llvm_version}.py /usr/local/bin/run-clang-tidy-{llvm_version}',
        f'ln -s /usr/local/libexec/c++-analyzer /usr/local/bin/c++-analyzer-{llvm_version}',
    ]

    tsan_stage += hpccm.building_blocks.generic_cmake(
        repository='https://github.com/llvm/llvm-project.git',
        directory='/var/tmp/llvm-project/llvm/',
        prefix='/usr/local', recursive=True, branch=compiler_branch,
        cmake_opts=['-D CMAKE_BUILD_TYPE=Release', '-D LLVM_ENABLE_PROJECTS="clang;openmp;clang-tools-extra;compiler-rt;lld"',
                    '-D LIBOMP_TSAN_SUPPORT=on'],
        postinstall=versioned_symlinks)
    output_stages['compiler_build'] = tsan_stage
def oneapi_runtime(_from='0'):
    """Return a stage fragment that copies oneAPI out of the 'oneapi-build' stage.

    The *_from* argument is accepted so the function can be called as
    ``runtime(_from=...)`` (see get_compiler), but it is not used: the files are
    always copied from the stage named 'oneapi-build'.
    """
    # Bring over the installation tree and the bashrc that sources setvars.sh.
    copied_paths = {"/opt/intel": "/opt/intel",
                    "/etc/bash.bashrc": "/etc/bash.bashrc"}
    runtime_stage = hpccm.Stage()
    runtime_stage += hpccm.primitives.copy(_from='oneapi-build', files=copied_paths)
    return runtime_stage
def add_oneapi_compiler_build_stage(input_args, output_stages: typing.MutableMapping[str, hpccm.Stage]):
    """Isolate the oneAPI preparation stage.

    This stage is isolated so that its installed components are minimized in the
    final image (chiefly /opt/intel) and its environment setup script can be
    sourced. This also helps with rebuild time and final image size.

    Args:
        input_args: Parsed command line arguments; ``input_args.oneapi`` is the
            version suffix of the Intel oneAPI packages to install.
        output_stages: Mutable mapping that receives the new stage under the
            key ``'compiler_build'``.

    Raises:
        RuntimeError: If *output_stages* is not a mutable mapping.
    """
    if not isinstance(output_stages, collections.abc.MutableMapping):
        raise RuntimeError('Need output_stages container.')
    oneapi_stage = hpccm.Stage()
    oneapi_stage += hpccm.primitives.baseimage(image=base_image_tag(input_args), _as='oneapi-build')

    version = str(input_args.oneapi)

    # Add required components for the next stage (both for hpccm and Intel's setvars.sh script)
    oneapi_stage += hpccm.building_blocks.packages(ospackages=['wget', 'gnupg2', 'ca-certificates', 'lsb-release'])
    oneapi_stage += hpccm.building_blocks.packages(
        apt_keys=['https://apt.repos.intel.com/intel-gpg-keys/GPG-PUB-KEY-INTEL-SW-PRODUCTS-2023.PUB'],
        apt_repositories=['deb https://apt.repos.intel.com/oneapi all main'],
        # Add minimal packages (not the whole HPC toolkit!)
        ospackages=[f'intel-oneapi-dpcpp-cpp-{version}',
                    f'intel-oneapi-openmp-{version}',
                    f'intel-oneapi-mkl-{version}',
                    f'intel-oneapi-mkl-devel-{version}']
    )
    # Ensure that all bash shells on the final container will have access to oneAPI
    oneapi_stage += hpccm.primitives.shell(
        commands=['echo "source /opt/intel/oneapi/setvars.sh" >> /etc/bash.bashrc']
    )
    # Attach the runtime hook as a plain (unbound) function attribute;
    # get_compiler() calls it as compiler_build_stage.runtime(_from='oneapi').
    setattr(oneapi_stage, 'runtime', oneapi_runtime)

    output_stages['compiler_build'] = oneapi_stage
# Build the list of shell commands that create and populate one Python venv.
#
# The venv lives at $HOME/venv/py<major>.<minor> and is created with the
# interpreter that pyenv reports for python<major>.<minor>. The later commands
# upgrade pip and setuptools and then pip-install the packages needed to build
# and test the gmxapi Python package.
# NOTE(review): the requirement list inside the first multi-line f-string looks
# incomplete; the 'importlib_resources' install is presumably guarded by a
# Python-version check (`minor` is otherwise unused); and no `return commands`
# is visible - confirm all three against upstream.
353 def prepare_venv(version: StrictVersion) -> typing.Sequence[str]:
354 """Get shell commands to set up the venv for the requested Python version."""
355 major = version.version[0]
356 minor = version.version[1] # type: int
358 pyenv = '$HOME/.pyenv/bin/pyenv'
360 py_ver = f'{major}.{minor}'
361 venv_path = f'$HOME/venv/py{py_ver}'
362 commands = [f'$({pyenv} prefix `{pyenv} whence python{py_ver}`)/bin/python -m venv {venv_path}']
364 commands.append(f'{venv_path}/bin/python -m pip install --upgrade pip setuptools')
365 # Install dependencies for building and testing gmxapi Python package.
366 # WARNING: Please keep this list synchronized with python_packaging/requirements-test.txt
367 # TODO: Get requirements.txt from an input argument.
368 commands.append(f"""{venv_path}/bin/python -m pip install --upgrade \
377 'scikit-build>=0.10'""")
379 # TODO: Remove 'importlib_resources' dependency when Python >=3.7 is required.
381 commands.append(f"""{venv_path}/bin/python -m pip install --upgrade \
382 'importlib_resources'""")
# Build one pyenv-based stage per requested Python version plus an aggregating
# 'pyenv' stage.
#
# For every entry of input_args.venvs (sorted, parsed as StrictVersion) a stage
# named 'py<version>' is created from base_image_tag(input_args). It receives
# the 'compiler' and 'mpi' building blocks and _python_extra_packages, installs
# pyenv, builds the interpreter with --enable-shared, and runs the commands
# from prepare_venv(). Each stage is stored in output_stages under its name,
# and the 'pyenv' stage (stored last, under 'pyenv') copies '/root/' from each.
#
# Raises RuntimeError if input_args.venvs is empty or output_stages is None or
# not a mapping.
# NOTE(review): the signature below lacks the `input_args` parameter that the
# body and the caller in build_stages() use, the docstring has no closing
# quotes, and the copy(...) call near the end of the loop looks truncated -
# confirm all of these against upstream.
387 def add_python_stages(building_blocks: typing.Mapping[str, bb_base],
389 output_stages: typing.MutableMapping[str, hpccm.Stage]):
390 """Add the stage(s) necessary for the requested venvs.
392 One intermediate build stage is created for each venv (see --venv option).
394 Each stage partially populates Python installations and venvs in the home
395 directory. The home directory is collected by the 'pyenv' stage for use by
396 the main build stage.
398 if len(input_args.venvs) < 1:
399 raise RuntimeError('No venvs to build...')
400 if output_stages is None or not isinstance(output_stages, collections.abc.Mapping):
401 raise RuntimeError('Need a container for output stages.')
403 # Main Python stage that collects the environments from individual stages.
404 # We collect the stages individually, rather than chaining them, because the
405 # copy is a bit slow and wastes local Docker image space for each filesystem
407 pyenv_stage = hpccm.Stage()
408 pyenv_stage += hpccm.primitives.baseimage(image=base_image_tag(input_args), _as='pyenv')
409 pyenv_stage += building_blocks['compiler']
410 pyenv_stage += building_blocks['mpi']
411 pyenv_stage += hpccm.building_blocks.packages(ospackages=_python_extra_packages)
413 for version in [StrictVersion(py_ver) for py_ver in sorted(input_args.venvs)]:
414 stage_name = 'py' + str(version)
415 stage = hpccm.Stage()
416 stage += hpccm.primitives.baseimage(image=base_image_tag(input_args), _as=stage_name)
417 stage += building_blocks['compiler']
418 stage += building_blocks['mpi']
419 stage += hpccm.building_blocks.packages(ospackages=_python_extra_packages)
421 # TODO: Use a non-root user for testing and Python virtual environments.
422 stage += hpccm.primitives.shell(commands=[
423 'curl https://pyenv.run | bash',
424 """echo 'export PYENV_ROOT="$HOME/.pyenv"' >> $HOME/.bashrc""",
425 """echo 'export PATH="$PYENV_ROOT/bin:$PATH"' >> $HOME/.bashrc""",
426 """echo 'eval "$(pyenv init -)"' >> $HOME/.bashrc""",
427 """echo 'eval "$(pyenv virtualenv-init -)"' >> $HOME/.bashrc"""])
428 pyenv = '$HOME/.pyenv/bin/pyenv'
429 commands = [f'PYTHON_CONFIGURE_OPTS="--enable-shared" {pyenv} install -s {version}']
430 stage += hpccm.primitives.shell(commands=commands)
432 commands = prepare_venv(version)
433 stage += hpccm.primitives.shell(commands=commands)
435 # TODO: Update user home directory.
436 pyenv_stage += hpccm.primitives.copy(_from=stage_name, _mkdir=True, src=['/root/'],
439 # Add the intermediate build stage to the sequence
440 output_stages[stage_name] = stage
442 # TODO: If we activate pyenv for login shells, the `global` "version" should be full-featured.
443 # # `version` should be a system installation or pyenv environment (or pyenv-virtualenv)
444 # # with the dependencies for all of the Python aspects of CMake-driven builds.
445 # commands = '{pyenv} global {version}'.format(
448 # pyenv_stage += hpccm.primitives.shell(commands=commands)
450 # Add the aggregating build stage to the sequence. This allows the main stage to copy
451 # the files in a single stage, potentially reducing the overall output image size.
452 output_stages['pyenv'] = pyenv_stage
# Append documentation tooling to output_stages['main'].
#
# Steps visible below: a sed command deletes the policy lines mentioning
# "XPS", "PDF", "PS", "EPS" (and the "disable ghostscript format types"
# comment) from /etc/ImageMagick-6/policy.xml; pip3 installs sphinx==1.6.1 and
# gcovr; then doxygen is provided. Version '1.8.5' is built from a pinned
# commit, together with a pinned flex installed under /tmp/install-of-flex;
# any other version is downloaded as a prebuilt binary archive from
# SourceForge and its doxygen binary is copied to /usr/local/bin.
# NOTE(review): the statement under `if input_args.doxygen is None:`, the
# `else:` before the binary download, parts of the doxygen
# generic_autotools(...) call, and the opening/closing of the `commands` list
# are not visible - confirm against upstream.
455 def add_documentation_dependencies(input_args,
456 output_stages: typing.MutableMapping[str, hpccm.Stage]):
457 """Add appropriate layers according to doxygen input arguments."""
458 if input_args.doxygen is None:
460 output_stages['main'] += hpccm.primitives.shell(
461 commands=['sed -i \'/\"XPS\"/d;/\"PDF\"/d;/\"PS\"/d;/\"EPS\"/d;/disable ghostscript format types/d\' /etc/ImageMagick-6/policy.xml'])
462 output_stages['main'] += hpccm.building_blocks.pip(pip='pip3', packages=['sphinx==1.6.1', 'gcovr'])
463 if input_args.doxygen == '1.8.5':
464 doxygen_commit = 'ed4ed873ab0e7f15116e2052119a6729d4589f7a'
465 output_stages['main'] += hpccm.building_blocks.generic_autotools(
466 repository='https://github.com/westes/flex.git',
467 commit='f7788a9a0ecccdc953ed12043ccb59ca25714018',
468 prefix='/tmp/install-of-flex',
469 configure_opts=['--disable-shared'],
470 preconfigure=['./autogen.sh'])
471 output_stages['main'] += hpccm.building_blocks.generic_autotools(
472 repository='https://github.com/doxygen/doxygen.git',
473 commit=doxygen_commit,
476 '--flex /tmp/install-of-flex/bin/flex',
479 version = input_args.doxygen
480 archive_name = f'doxygen-{version}.linux.bin.tar.gz'
481 archive_url = f'https://sourceforge.net/projects/doxygen/files/rel-{version}/{archive_name}'
482 binary_path = f'doxygen-{version}/bin/doxygen'
484 'mkdir doxygen && cd doxygen',
485 f'wget {archive_url}',
486 f'tar xf {archive_name} {binary_path}',
487 f'cp {binary_path} /usr/local/bin/',
488 'cd .. && rm -rf doxygen'
490 output_stages['main'] += hpccm.primitives.shell(commands=commands)
# Assemble, in dependency order, every stage of the recipe described by *args*.
#
# Sequence visible below:
#   1. an optional 'compiler_build' stage (TSAN LLVM, or oneAPI);
#   2. reusable building blocks: base packages, compiler, MPI, one CMake
#      install per entry of args.cmake (prefix /usr/local/cmake-<version>),
#      extra OS packages, and clFFT;
#   3. optional Python stages, only when both MPI and venvs are requested;
#   4. the 'main' stage: base image, the building blocks, Python 3 with pip
#      (pytest, networkx, numpy), optional documentation tooling, the pyenv
#      and venv trees copied from the 'pyenv' stage, and a check that
#      /usr/bin/python resolves.
# `stages` is an OrderedDict, so insertion order is the output order.
# NOTE(review): the bodies of the two trailing `for` loops, and parts of the
# cmake(...), packages(...) and copy(...) calls, are not visible - confirm
# against upstream. Note also that when both TSAN and oneAPI are requested, the
# second assignment to stages['compiler_build'] replaces the first.
493 def build_stages(args) -> typing.Iterable[hpccm.Stage]:
494 """Define and sequence the stages for the recipe corresponding to *args*."""
496 # A Dockerfile or Singularity recipe can have multiple build stages.
497 # The main build stage can copy files from previous stages, though only
498 # the last stage is included in the tagged output image. This means that
499 # large or expensive sets of build instructions can be isolated in
500 # local/temporary images, but all of the stages need to be output by this
501 # script, and need to occur in the correct order, so we create a sequence
502 # object early in this function.
503 stages = collections.OrderedDict()
505 # If we need TSAN or oneAPI support the early build is more complex,
506 # so that our compiler images don't have all the cruft needed to get those things
508 if args.llvm is not None and args.tsan is not None:
509 add_tsan_compiler_build_stage(input_args=args, output_stages=stages)
510 if args.oneapi is not None:
511 add_oneapi_compiler_build_stage(input_args=args, output_stages=stages)
513 # Building blocks are chunks of container-builder instructions that can be
514 # copied to any build stage with the addition operator.
515 building_blocks = collections.OrderedDict()
516 building_blocks['base_packages'] = hpccm.building_blocks.packages(
517 ospackages=_common_packages)
519 # These are the most expensive and most reusable layers, so we put them first.
520 building_blocks['compiler'] = get_compiler(args, compiler_build_stage=stages.get('compiler_build'))
521 building_blocks['mpi'] = get_mpi(args, building_blocks['compiler'])
522 for i, cmake in enumerate(args.cmake):
523 building_blocks['cmake' + str(i)] = hpccm.building_blocks.cmake(
525 prefix=f'/usr/local/cmake-{cmake}',
528 # Install additional packages early in the build to optimize Docker build layer cache.
529 os_packages = list(get_llvm_packages(args)) + get_opencl_packages(args)
530 if args.doxygen is not None:
531 os_packages += _docs_extra_packages
532 if args.oneapi is not None:
533 os_packages += ['lsb-release']
534 building_blocks['extra_packages'] = hpccm.building_blocks.packages(
535 ospackages=os_packages,
536 apt_ppas=['ppa:intel-opencl/intel-opencl'],
537 apt_keys=['http://repo.radeon.com/rocm/apt/debian/rocm.gpg.key'],
538 apt_repositories=['deb [arch=amd64] http://repo.radeon.com/rocm/apt/debian/ xenial main']
541 building_blocks['clfft'] = get_clfft(args)
543 # Add Python environments to MPI images, only, so we don't have to worry
544 # about whether to install mpi4py.
545 if args.mpi is not None and len(args.venvs) > 0:
546 add_python_stages(building_blocks=building_blocks, input_args=args, output_stages=stages)
548 # Create the stage from which the targeted image will be tagged.
549 stages['main'] = hpccm.Stage()
551 stages['main'] += hpccm.primitives.baseimage(image=base_image_tag(args))
552 for bb in building_blocks.values():
556 # We always add Python3 and Pip
557 stages['main'] += hpccm.building_blocks.python(python3=True, python2=False, devel=True)
558 stages['main'] += hpccm.building_blocks.pip(upgrade=True, pip='pip3',
559 packages=['pytest', 'networkx', 'numpy'])
561 # Add documentation requirements (doxygen and sphinx + misc).
562 if args.doxygen is not None:
563 add_documentation_dependencies(args, stages)
565 if 'pyenv' in stages and stages['pyenv'] is not None:
566 stages['main'] += hpccm.primitives.copy(_from='pyenv', _mkdir=True, src=['/root/.pyenv/'],
568 stages['main'] += hpccm.primitives.copy(_from='pyenv', _mkdir=True, src=['/root/venv/'],
570 # TODO: Update user home directory.
571 # TODO: If we activate pyenv for login shells, the `global` "version" should be full-featured.
572 # stages['main'] += hpccm.primitives.copy(_from='pyenv', src=['/root/.bashrc'],
575 # Make sure that `python` resolves to something.
576 stages['main'] += hpccm.primitives.shell(commands=['test -x /usr/bin/python || '
577 'update-alternatives --install /usr/bin/python python /usr/bin/python3 1 && '
578 '/usr/bin/python --version'])
580 # Note that the list of stages should be sorted in dependency order.
581 for build_stage in stages.values():
582 if build_stage is not None:
586 if __name__ == '__main__':
587 args = parser.parse_args()
589 # Set container specification output format
590 hpccm.config.set_container_format(args.format)
592 container_recipe = build_stages(args)
594 # Output container specification
595 for stage in container_recipe: