aws-ofi-rccl/1.4.0-cpeGNU-22.12-rocm-5.3.2 (aws-ofi-rccl-1.4.0-cpeGNU-22.12-rocm-5.3.2.eb)
This software is archived in the LUMI-EasyBuild-contrib GitHub repository as easybuild/easyconfigs/__archive__/a/aws-ofi-rccl/aws-ofi-rccl-1.4.0-cpeGNU-22.12-rocm-5.3.2.eb. The corresponding module would be aws-ofi-rccl/1.4.0-cpeGNU-22.12-rocm-5.3.2.
# EasyBuild recipe for the AWS OFI RCCL plug-in: fetched from a pinned git
# commit, bootstrapped with autogen.sh and built with the generic
# ConfigureMake easyblock against an externally provided ROCm module.
easyblock = 'ConfigureMake'

# ROCm release used for both the version suffix and the external module
# dependency, kept in one place so the two cannot drift apart.
# NOTE(review): the file name this easyconfig is archived under carries
# "rocm-5.3.2", while the suffix and dependency here use 5.2.3 - confirm
# which one is intended.
local_rocm_version = '5.2.3'

# GitHub organisation hosting the project (used for homepage, license and sources).
local_github_org = 'https://github.com/ROCmSoftwarePlatform'

name = 'aws-ofi-rccl'
# Version number taken from the upstream release notes:
# https://github.com/ROCmSoftwarePlatform/aws-ofi-rccl/blob/cxi/RELEASENOTES.md
version = '1.4.0'
versionsuffix = '-rocm-%s' % local_rocm_version

homepage = local_github_org + '/aws-ofi-rccl'

whatis = [
    'Description: AWS OFI RCCL is a plug-in which enables EC2 developers to use libfabric as a network provider.',
]

description = """
Machine learning frameworks running on top of AMD GPUs use a library called
RCCL which provides standard collective communication routines for an arbitrary
number of GPUs installed across single or multiple nodes.
This module implements a plug-in which maps RCCLs connection-oriented transport
APIs to libfabric's connection-less reliable interface. This allows RCCL
applications to take benefit of libfabric's transport layer services like
reliable message support and operating system bypass.
"""

software_license_urls = [homepage + '/blob/cxi/LICENSE']

# The plugin build needs access to the MPI directory.
# NOTE(review): presumably that is why a full cpe toolchain is used here - confirm.
toolchain = {'name': 'cpeGNU', 'version': '22.12'}

# No release tarball is referenced: the sources are a git checkout of one
# specific commit, packed under the given file name.
sources = [
    {
        'filename': '%(name)s-%(version)s.tar.gz',
        'git_config': {
            'url': local_github_org,
            'repo_name': '%(name)s',
            'commit': '52cbc4766401be4410fd0aa5207f2f9b6226c321',
        },
    },
]

builddependencies = [
    ('buildtools', '%(toolchain_version)s', '', True),
]

dependencies = [
    ('rocm/%s' % local_rocm_version, 'EXTERNAL_MODULE'),
]

# autogen.sh has to run before configure.
preconfigopts = ' ./autogen.sh && '

# The libfabric prefix is resolved at build time from the version reported by
# pkg-config; the HIP and RCCL prefixes are taken from $ROCM_PATH.
local_configure_flags = [
    '--with-libfabric=/opt/cray/libfabric/$(pkg-config --modversion libfabric)',
    '--with-hip=$ROCM_PATH/hip',
    '--with-rccl=$ROCM_PATH/rccl',
]
# Every flag is padded with one blank on either side, as in a hand-written option string.
configopts = ''.join(' %s ' % local_flag for local_flag in local_configure_flags)

sanity_check_paths = {
    'files': ['lib/librccl-net.so.0.0.0'],
    'dirs': ['bin', 'lib'],
}

moduleclass = 'devel'