modified: c/CUDAcore/CUDAcore-11.6.0.eb

new file:   f/FFTW/FFTW-3.3.10-NVHPC-23.5-CUDA-12.2.0.eb
	new file:   n/NCCL/NCCL-2.16.2-GCCcore-12.2.0-CUDA-12.2.0.eb
	modified:   n/NVHPC/NVHPC-22.2.eb
	new file:   o/OpenMPI/OpenMPI-4.1.5-NVHPC-23.5-CUDA-12.2.0.eb
	new file:   p/Perl/Perl-5.34.1-GCCcore-11.3.0.eb
	modified:   p/pkg-config/pkg-config-0.29.2.eb
	new file:   p/pkgconf/pkgconf-1.8.0-GCCcore-12.2.0.eb
	new file:   u/UCC-CUDA/UCC-CUDA-1.1.0-GCCcore-12.2.0-CUDA-12.2.0.eb
	new file:   u/UCX-CUDA/UCX-CUDA-1.14.0-GCCcore-12.2.0-CUDA-12.2.0.eb
This commit is contained in:
Lukas Krupcik 2023-08-08 09:24:57 +02:00
parent c629361037
commit b88bcade3e
10 changed files with 2255 additions and 0 deletions

View File

@ -17,5 +17,6 @@ toolchain = SYSTEM
# Download location of NVIDIA's local runfile installers for this CUDA version.
source_urls = ['https://developer.download.nvidia.com/compute/cuda/%(version)s/local_installers/']
# Only the bare %s is filled in here, with local_nv_version (defined outside the lines shown);
# the doubled %% leaves %(version)s and %(cudaarch)s in the name as literal placeholders.
sources = ['cuda_%%(version)s_%s_linux%%(cudaarch)s.run' % local_nv_version]
# Checksum for the single source file listed above.
checksums = ['1783da6d63970786040980b57fa3cb6420142159fc7d0e66f8f05c4905d98c83']
moduleclass = 'system'

View File

@ -0,0 +1,27 @@
# IT4Innovations
# LK 2023
#
# FFTW 3.3.10 built with the NVHPC 23.5 toolchain; CUDA 12.2.0 is pulled in
# as a system-toolchain dependency.
# NOTE(review): the commit lists this file as FFTW-3.3.10-NVHPC-23.5-CUDA-12.2.0.eb,
# but no versionsuffix is set below -- confirm the file name matches the
# module name that is actually intended.

name = 'FFTW'
version = '3.3.10'

homepage = 'https://www.fftw.org'
description = """FFTW is a C subroutine library for computing the discrete Fourier transform (DFT)
in one or more dimensions, of arbitrary input size, and of both real and complex data."""

toolchain = {'name': 'NVHPC', 'version': '23.5'}
toolchainopts = {'pic': True}

# The source URL is the homepage itself.
source_urls = [homepage]
sources = [SOURCELOWER_TAR_GZ]
checksums = ['56c932549852cddcfafdab3820b0200c7742675be92179e59e6215b340e26467']

dependencies = [
    # SYSTEM instead of a bare True: same meaning (dependency built with the
    # system toolchain), spelled the way the GCCcore-based CUDA 12.2.0
    # easyconfigs added alongside this file spell it.
    ('CUDA', '12.2.0', '', SYSTEM),
]

# Does not work with nvc
with_quad_prec = False

runtest = 'check'

moduleclass = 'numlib'

View File

@ -0,0 +1,29 @@
# IT4Innovations
# LK 2023
#
# NCCL 2.16.2 on GCCcore 12.2.0; CUDA 12.2.0 comes from the system toolchain.

name = "NCCL"
version = "2.16.2"
versionsuffix = "-CUDA-%(cudaver)s"

homepage = "https://developer.nvidia.com/nccl"
description = """The NVIDIA Collective Communications Library (NCCL) implements multi-GPU and multi-node collective
communication primitives that are performance optimized for NVIDIA GPUs."""

toolchain = {"name": "GCCcore", "version": "12.2.0"}

# The release tarball carries a "-1" after the version number.
github_account = "NVIDIA"
source_urls = [GITHUB_SOURCE]
sources = ["v%(version)s-1.tar.gz"]
checksums = ["7f7c738511a8876403fc574d13d48e7c250d934d755598d82e14bab12236fc64"]

builddependencies = [
    ("binutils", "2.39"),
]

dependencies = [
    ("CUDA", "12.2.0", "", SYSTEM),
    # Same suffix as this easyconfig's own versionsuffix.
    # NOTE(review): the commit adding this file lists UCX-CUDA 1.14.0 for
    # GCCcore 12.2.0 / CUDA 12.2.0 -- confirm that a 1.13.1 build with this
    # suffix is really available, or whether 1.14.0 was meant.
    ("UCX-CUDA", "1.13.1", "-CUDA-%(cudaver)s"),
]

# default CUDA compute capabilities to use (override via --cuda-compute-capabilities)
cuda_compute_capabilities = [
    "5.0",
    "6.0",
    "7.0",
    "7.5",
    "8.0",
    "8.6",
    "9.0",
]

moduleclass = "lib"

View File

@ -14,6 +14,7 @@ accept_eula = True
# Download location of the HPC SDK tarballs for this version.
source_urls = ['https://developer.download.nvidia.com/hpc-sdk/%(version)s/']
# Tarball name pattern. The doubled %% keeps %(version_major)s and %(version_minor)s
# as literal placeholders; the single %s is a slot filled in on the next line.
# The release year (2022) is hard-coded in the name.
local_tarball_tmpl = 'nvhpc_2022_%%(version_major)s%%(version_minor)s_Linux_%s_cuda_multi.tar.gz'
# The %s slot receives the literal text %(arch)s, so the resulting file name
# still contains three unexpanded placeholders.
sources = [local_tarball_tmpl % '%(arch)s']
# Checksum for the single source file listed above.
checksums = ['8dfb4007d6912b2722946358ac69409592c1f03426d81971ffbcb6fc5fea2cb8']
# Not used within the lines shown here -- presumably consumed by the
# dependencies list that follows; confirm against the full file.
local_gccver = '10.2.0'
dependencies = [

View File

@ -0,0 +1,109 @@
# IT4Innovations
# LK 2023
#
# Open MPI 4.1.5 built with the NVHPC 23.5 toolchain, with CUDA 12.2.0 and
# UCX 1.14.0 as the only active dependencies.
# NOTE(review): the commit lists this file as OpenMPI-4.1.5-NVHPC-23.5-CUDA-12.2.0.eb,
# but no versionsuffix is set below -- confirm the file name matches the
# module name that is actually intended.

name = 'OpenMPI'
version = '4.1.5'

homepage = 'https://www.open-mpi.org/'
description = """The Open MPI Project is an open source MPI-3 implementation."""

toolchain = {'name': 'NVHPC', 'version': '23.5'}

source_urls = ['https://www.open-mpi.org/software/ompi/v%(version_major_minor)s/downloads']
sources = [SOURCELOWER_TAR_BZ2]
patches = [
    'OpenMPI-4.1.1_build-with-internal-cuda-header.patch',
    'OpenMPI-4.1.1_opal-datatype-cuda-performance.patch',
]
# One checksum per entry above: the source tarball first, then the patches in order.
checksums = [
    'a640986bc257389dd379886fdae6264c8cfa56bc98b71ce3ae3dfbd8ce61dbe3',  # openmpi-4.1.5.tar.bz2
    # OpenMPI-4.1.1_build-with-internal-cuda-header.patch
    '63eac52736bdf7644c480362440a7f1f0ae7c7cae47b7565f5635c41793f8c83',
    # OpenMPI-4.1.1_opal-datatype-cuda-performance.patch
    'b767c7166cf0b32906132d58de5439c735193c9fd09ec3c5c11db8d5fa68750e',
]

# Build dependencies are disabled.
# NOTE(review): preconfigopts in this file runs autom4te/autoconf/autoheader/
# aclocal/automake, so with Autotools commented out those tools have to come
# from somewhere else (presumably the OS) -- confirm.
#builddependencies = [
#    ('pkgconf', '1.9.3'),
#    ('Perl', '5.36.0'),
#    ('Autotools', '20220317'),
#]

# Only CUDA and UCX are active; the remaining entries are kept commented out.
dependencies = [
    # ('zlib', '1.2.12'),
    # SYSTEM instead of a bare True: same meaning (dependency built with the
    # system toolchain), spelled the way the GCCcore-based CUDA 12.2.0
    # easyconfigs added alongside this file spell it.
    ('CUDA', '12.2.0', '', SYSTEM),
    # ('hwloc', '2.8.0'),
    # ('libevent', '2.1.12'),
    ('UCX', '1.14.0'),
    # ('UCX-CUDA', '1.14.0', '-CUDA-%(cudaver)s'),
    # ('libfabric', '1.16.1'),
    # ('PMIx', '4.2.2'),
    # ('UCC', '1.1.0'),
    # ('UCC-CUDA', '1.1.0', '-CUDA-%(cudaver)s'),
]
# Regenerate just enough of the build system for the "internal-cuda" patch to
# take effect in configure: a subset of what autogen.pl does, avoiding the
# full, long-running regeneration.
local_regen_steps = (
    'cd config',
    'autom4te --language=m4sh opal_get_version.m4sh -o opal_get_version.sh',
    'cd ..',
    'autoconf',
    'autoheader',
    'aclocal',
    'automake',
)
# Every step -- the last one included -- is followed by ' && ', so whatever
# command is appended after preconfigopts is chained onto the sequence.
preconfigopts = ''.join(local_step + ' && ' for local_step in local_regen_steps)
# Configure options, collected in a list and joined once at the end.
#
# The previous version built this string with a chain of '+=' statements, but
# the '--with-slurm' line used plain '=' and thereby threw away everything set
# before it (CUDA, compiler selection, CXXFLAGS, thread-multiple, verbs,
# prefix-by-default). Joining a list makes that kind of slip impossible and
# also takes care of the separating spaces.
local_configopts = [
    # CUDA related patches and custom configure option can be removed if CUDA support isn't wanted.
    '--with-cuda=internal',
    'CC=pgcc CXX=pgc++ FC=pgfortran',
    'CXXFLAGS="-fPIC"',
    # IT4I-specific settings
    # '--enable-shared',
    '--enable-mpi-thread-multiple',
    '--with-verbs',
    '--enable-mpirun-prefix-by-default',
    # hwloc support stays disabled: hwloc is commented out in this file's
    # dependencies, so $EBROOTHWLOC would expand to nothing. (The option never
    # reached configure before either, because it was overwritten.)
    # NOTE(review): re-enable together with the hwloc dependency if wanted.
    # '--with-hwloc=$EBROOTHWLOC',
    '--with-slurm',  # Enable slurm
    '--enable-mpi-cxx',  # Enable building the C++ MPI bindings
    '--with-ucx=$EBROOTUCX',
]
configopts = ' '.join(local_configopts)
# A single OS-level requirement, given as a tuple of three package names.
osdependencies = [
    ('libibverbs-dev', 'libibverbs-devel', 'rdma-core-devel'),
]

# After installation, append two lines to the installed MCA parameter file:
# an explanatory comment and the setting that allows InfiniBand ports to be used.
local_mca_conf = '%(installdir)s/etc/openmpi-mca-params.conf'
local_mca_lines = (
    '# By default, for Open MPI 4.0 and later, infiniband ports on a device are not used by default.',
    'btl_openib_allow_ib = true',
)
postinstallcmds = [
    'echo "%s" >> %s' % (local_mca_line, local_mca_conf)
    for local_mca_line in local_mca_lines
]
# Names from which the expected installed files are derived. SHLIB_EXT is not
# defined in this file; it has to be supplied from outside.
local_libs = ["mpi_mpifh", "mpi", "ompitrace", "open-pal", "open-rte"]
local_bins = ["ompi_info", "opal_wrapper", "orterun"]
local_headers = ["mpi-ext", "mpif-config", "mpif", "mpi", "mpi_portable_platform"]

# Order matters only for readability: executables, then shared libraries, then headers.
local_expected_files = []
local_expected_files.extend("bin/{}".format(local_bin) for local_bin in local_bins)
local_expected_files.extend("lib/lib{}.{}".format(local_lib, SHLIB_EXT) for local_lib in local_libs)
local_expected_files.extend("include/{}.h".format(local_hdr) for local_hdr in local_headers)

sanity_check_paths = {
    'files': local_expected_files,
    'dirs': [],
}
import os

# Extra environment variables for the generated module, chosen by the value of
# the CLUSTERNAME environment variable at the time this file is evaluated.
local_modextravars_by_cluster = {
    'BARBORA': {
        'OMPI_MCA_btl_openib_if_include': 'mlx5_0',
        'OMPI_MCA_btl_tcp_if_include': '10.33.4.0/24',
        'OMPI_MCA_orte_base_help_aggregate': '0',
    },
    'KAROLINA': {
        'OMPI_MCA_btl_openib_if_include': 'mlx5_0',
        'OMPI_MCA_orte_base_help_aggregate': '0',
    },
}

# Used when CLUSTERNAME is unset or names any other cluster.
local_modextravars_default = {
    'OMPI_MCA_btl_openib_if_include': 'mlx4_0',
    'OMPI_MCA_oob_tcp_if_include': '10.0.0.0/8',
}

modextravars = local_modextravars_by_cluster.get(
    os.environ.get("CLUSTERNAME"),
    local_modextravars_default,
)

moduleclass = 'mpi'

File diff suppressed because it is too large Load Diff

View File

@ -16,6 +16,7 @@ toolchain = SYSTEM
# Source tarball name comes from the SOURCELOWER_TAR_GZ constant (not defined in the lines shown).
sources = [SOURCELOWER_TAR_GZ]
# Note: plain http download location.
source_urls = ['http://pkgconfig.freedesktop.org/releases/']
# Checksum for the single source file listed above.
checksums = ['6fc69c01688c9458a57eb9a1664c9aba372ccda420a02bf4429fe610e7e7d591']
# Extra configure flag; the leading space is part of the value.
configopts = " --with-internal-glib"

View File

@ -0,0 +1,34 @@
# IT4Innovations
# LK 2023
#
# pkgconf 1.8.0 on GCCcore 12.2.0, installed with an additional pkg-config
# symlink so both command names are available.

easyblock = "ConfigureMake"

name = "pkgconf"
version = "1.8.0"

homepage = "https://github.com/pkgconf/pkgconf"
description = """pkgconf is a program which helps to configure compiler and linker flags for development libraries.
It is similar to pkg-config from freedesktop.org."""

toolchain = {"name": "GCCcore", "version": "12.2.0"}

source_urls = ["https://distfiles.ariadne.space/pkgconf/"]
sources = [SOURCELOWER_TAR_GZ]
checksums = ["d7b6fdb522d81c11f5a0e0a0629a9f5480809ec90e595058674c1517822dfb8c"]

builddependencies = [
    ("binutils", "2.39"),
]

# Create bin/pkg-config as a symlink to bin/pkgconf.
postinstallcmds = [
    "cd %(installdir)s/bin && ln -s pkgconf pkg-config",
]

# Both command names must exist after installation and answer to --help.
local_commands = ("pkg-config", "pkgconf")

sanity_check_paths = {
    "files": ["bin/" + local_cmd for local_cmd in local_commands],
    "dirs": [],
}

sanity_check_commands = [local_cmd + " --help" for local_cmd in local_commands]

moduleclass = "devel"

View File

@ -0,0 +1,60 @@
# IT4Innovations
# LK 2023
#
# CUDA add-on for UCC 1.1.0 on GCCcore 12.2.0: only the mc/cuda and tl/nccl
# components are built and installed, next to an existing UCC dependency.

easyblock = "ConfigureMake"

name = "UCC-CUDA"
version = "1.1.0"
versionsuffix = "-CUDA-%(cudaver)s"

homepage = "https://www.openucx.org/"
description = """UCC (Unified Collective Communication) is a collective
communication operations API and library that is flexible, complete, and
feature-rich for current and emerging programming models and runtimes.
This module adds the UCC CUDA support.
"""

toolchain = {"name": "GCCcore", "version": "12.2.0"}
toolchainopts = {"pic": True}

source_urls = ["https://github.com/openucx/ucc/archive/refs/tags"]
sources = ["v%(version)s.tar.gz"]
patches = [
    "%(name)s-1.0.0_link_against_existing_UCC_libs.patch",
    "%(name)s-%(version)s_cuda_12_mem_ops.patch",
]
# Each checksum is keyed by the file it belongs to.
checksums = [
    {"v1.1.0.tar.gz": "74c8ba75037b5bd88cb703e8c8ae55639af3fecfd4428912a433c010c97b4df7"},
    {
        "UCC-CUDA-1.0.0_link_against_existing_UCC_libs.patch":
            "9fa11cf6779174f4e9048df5812096e4261e1769d465cc7f34a6354398876856",
    },
    {
        "UCC-CUDA-1.1.0_cuda_12_mem_ops.patch":
            "fc3ea1487d29dc626db2363ef5a79e7f0906f6a7507a363fa6167a812b143eb6",
    },
]

builddependencies = [
    ("binutils", "2.39"),
    ("Autotools", "20220317"),
]

# UCX-CUDA and NCCL carry the same suffix as this easyconfig.
dependencies = [
    ("UCC", "1.1.0"),
    ("CUDA", "12.2.0", "", SYSTEM),
    # NOTE(review): the commit adding this file lists UCX-CUDA 1.14.0 for
    # GCCcore 12.2.0 / CUDA 12.2.0 -- confirm that a 1.13.1 build with this
    # suffix is really available, or whether 1.14.0 was meant.
    ("UCX-CUDA", "1.13.1", versionsuffix),
    ("NCCL", "2.16.2", versionsuffix),
]

preconfigopts = "./autogen.sh && "

# The two component directories that get built and installed. The first one is
# passed as arguments to the build/install command itself; the second needs an
# explicit extra 'make' chained with '&&'.
local_mc_cuda_dir = "src/components/mc/cuda"
local_tl_nccl_dir = "src/components/tl/nccl"

buildopts = "-C %s V=1 && make -C %s V=1" % (local_mc_cuda_dir, local_tl_nccl_dir)
installopts = "-C %s && make -C %s install" % (local_mc_cuda_dir, local_tl_nccl_dir)

sanity_check_paths = {
    "files": [
        "lib/ucc/libucc_%s.%s" % (local_component, SHLIB_EXT)
        for local_component in ("mc_cuda", "tl_nccl")
    ],
    "dirs": ["lib"],
}

sanity_check_commands = ["ucc_info -c"]

modextrapaths = {"EB_UCC_EXTRA_COMPONENT_PATH": "lib/ucc"}

moduleclass = "lib"

View File

@ -0,0 +1,44 @@
# IT4Innovations
# LK 2023
#
# CUDA plugins for UCX 1.14.0 on GCCcore 12.2.0, built against an existing
# UCX dependency and CUDA 12.2.0 from the system toolchain.

easyblock = 'EB_UCX_Plugins'

name = 'UCX-CUDA'
version = '1.14.0'
versionsuffix = '-CUDA-%(cudaver)s'

homepage = 'http://www.openucx.org/'
description = """Unified Communication X
An open-source production grade communication framework for data centric
and high-performance applications
This module adds the UCX CUDA support.
"""

toolchain = {'name': 'GCCcore', 'version': '12.2.0'}
toolchainopts = {'pic': True}

source_urls = ['https://github.com/openucx/ucx/releases/download/v%(version)s']
# alt_location names 'UCX' as an alternative location for the tarball.
sources = [{'filename': 'ucx-%(version)s.tar.gz', 'alt_location': 'UCX'}]
patches = ['%(name)s-1.11.0_link_against_existing_UCX_libs.patch']
checksums = [
    # The tarball used to accept either of two checksums, one of which was the
    # patch's checksum from the entry below. Two different files cannot share a
    # SHA256, so that alternative could only ever weaken the check; it is
    # dropped and the tarball is pinned to a single value.
    '9bd95e2059de5dece9dddd049aacfca3d21bfca025748a6a0b1be4486e28afdd',  # ucx-1.14.0.tar.gz
    {'UCX-CUDA-1.11.0_link_against_existing_UCX_libs.patch':
     '457187fa020e526609ba91e7750c9941d57bd57d60d6eed317b40ad8824aca93'},
]

builddependencies = [
    ('binutils', '2.39'),
    ('Autotools', '20220317'),
    # NOTE(review): the commit adding this file also adds pkgconf 1.8.0 for
    # GCCcore 12.2.0 -- confirm that 1.9.3 is the version intended here.
    ('pkgconf', '1.9.3'),
]

dependencies = [
    ('zlib', '1.2.12'),
    ('UCX', '1.14.0'),
    ('CUDA', '12.2.0', '', SYSTEM),
    ('GDRCopy', '2.3'),
]

moduleclass = 'lib'