diff --git a/Golden_Repo/o/OpenMPI-settings/OpenMPI-settings-4.1-CUDA-UCC.eb b/Golden_Repo/o/OpenMPI-settings/OpenMPI-settings-4.1-CUDA-UCC.eb new file mode 100644 index 0000000000000000000000000000000000000000..d4ef0f56e1e3c0b897e1c18d4394c10893e4f75e --- /dev/null +++ b/Golden_Repo/o/OpenMPI-settings/OpenMPI-settings-4.1-CUDA-UCC.eb @@ -0,0 +1,55 @@ +easyblock = 'SystemBundle' + +name = 'OpenMPI-settings' +version = '4.1' +versionsuffix = 'CUDA-UCC' + +homepage = '' +description = '''This module loads the default OpenMPI configuration. It relies on UCX and enables the UCX CUDA +transports. It also relies on UCC for collectives. +''' + +toolchain = SYSTEM + +source_urls = [] + +sources = [] +modextravars = { + 'SLURM_MPI_TYPE': 'pspmix', + 'OMPI_MCA_mca_base_component_show_load_errors': '1', + 'OMPI_MCA_mpi_param_check': '1', + 'OMPI_MCA_mpi_show_handle_leaks': '1', + 'OMPI_MCA_mpi_warn_on_fork': '1', + # Disable uct for the time being due to: + # https://github.com/openucx/ucx/wiki/OpenMPI-and-OpenSHMEM-installation-with-UCX#running-open-mpi-with-ucx + # Also openib, since it is deprecated and should be substituted by the UCX support in the pml + 'OMPI_MCA_btl': '^uct,openib', + 'OMPI_MCA_btl_openib_allow_ib': '1', + 'OMPI_MCA_bml_r2_show_unreach_errors': '0', + 'OMPI_MCA_coll_ucc_priority': '80', + 'OMPI_MCA_coll_ucc_enable': '1', + 'OMPI_MCA_pml': 'ucx', + 'OMPI_MCA_osc': '^rdma', + 'OMPI_MCA_opal_abort_print_stack': '1', + 'OMPI_MCA_opal_set_max_sys_limits': '1', + 'OMPI_MCA_opal_event_include': 'epoll', + 'OMPI_MCA_btl_openib_warn_default_gid_prefix': '0', + # OMPIO does not seem to work reliably on our system + 'OMPI_MCA_io': 'romio321', +} + +modluafooter = ''' +if mode()=="load" then + if isloaded("UCX-settings/RC") then + try_load("UCX-settings/RC-CUDA") + elseif isloaded("UCX-settings/UD") then + try_load("UCX-settings/UD-CUDA") + elseif isloaded("UCX-settings/DC") then + try_load("UCX-settings/DC-CUDA") + elseif not isloaded("UCX-settings") then + 
try_load("UCX-settings/RC-CUDA") + end +end +''' + +moduleclass = 'system' diff --git a/Golden_Repo/o/OpenMPI-settings/OpenMPI-settings-4.1-CUDA.eb b/Golden_Repo/o/OpenMPI-settings/OpenMPI-settings-4.1-CUDA.eb new file mode 100644 index 0000000000000000000000000000000000000000..65d7ab3888dc45ab01de8cee6ef15b51995495ed --- /dev/null +++ b/Golden_Repo/o/OpenMPI-settings/OpenMPI-settings-4.1-CUDA.eb @@ -0,0 +1,53 @@ +easyblock = 'SystemBundle' + +name = 'OpenMPI-settings' +version = '4.1' +versionsuffix = 'CUDA' + +homepage = '' +description = '''This module loads the default OpenMPI configuration. It relies on UCX and enables the UCX CUDA +transports. +''' + +toolchain = SYSTEM + +source_urls = [] + +sources = [] +modextravars = { + 'SLURM_MPI_TYPE': 'pspmix', + 'OMPI_MCA_mca_base_component_show_load_errors': '1', + 'OMPI_MCA_mpi_param_check': '1', + 'OMPI_MCA_mpi_show_handle_leaks': '1', + 'OMPI_MCA_mpi_warn_on_fork': '1', + # Disable uct for the time being due to: + # https://github.com/openucx/ucx/wiki/OpenMPI-and-OpenSHMEM-installation-with-UCX#running-open-mpi-with-ucx + # Also openib, since it is deprecated and should be substituted by the UCX support in the pml + 'OMPI_MCA_btl': '^uct,openib', + 'OMPI_MCA_btl_openib_allow_ib': '1', + 'OMPI_MCA_bml_r2_show_unreach_errors': '0', + 'OMPI_MCA_pml': 'ucx', + 'OMPI_MCA_osc': '^rdma', + 'OMPI_MCA_opal_abort_print_stack': '1', + 'OMPI_MCA_opal_set_max_sys_limits': '1', + 'OMPI_MCA_opal_event_include': 'epoll', + 'OMPI_MCA_btl_openib_warn_default_gid_prefix': '0', + # OMPIO does not seem to work reliably on our system + 'OMPI_MCA_io': 'romio321', +} + +modluafooter = ''' +if mode()=="load" then + if isloaded("UCX-settings/RC") then + try_load("UCX-settings/RC-CUDA") + elseif isloaded("UCX-settings/UD") then + try_load("UCX-settings/UD-CUDA") + elseif isloaded("UCX-settings/DC") then + try_load("UCX-settings/DC-CUDA") + elseif not isloaded("UCX-settings") then + try_load("UCX-settings/RC-CUDA") + end +end +''' + 
+moduleclass = 'system' diff --git a/Golden_Repo/o/OpenMPI-settings/OpenMPI-settings-4.1-UCC.eb b/Golden_Repo/o/OpenMPI-settings/OpenMPI-settings-4.1-UCX-UCC.eb similarity index 88% rename from Golden_Repo/o/OpenMPI-settings/OpenMPI-settings-4.1-UCC.eb rename to Golden_Repo/o/OpenMPI-settings/OpenMPI-settings-4.1-UCX-UCC.eb index 1ca737acaa4f09ac727bc8477745af3e40cbb438..28d20bc68ef2f51e05fcd1f40707068ea7c1612e 100644 --- a/Golden_Repo/o/OpenMPI-settings/OpenMPI-settings-4.1-UCC.eb +++ b/Golden_Repo/o/OpenMPI-settings/OpenMPI-settings-4.1-UCX-UCC.eb @@ -2,10 +2,12 @@ easyblock = 'SystemBundle' name = 'OpenMPI-settings' version = '4.1' -versionsuffix = 'UCC' +versionsuffix = 'UCX-UCC' homepage = '' -description = 'This module loads the default OpenMPI configuration. It relies on UCX and UCC.' +description = '''This module loads the default OpenMPI configuration. It relies on UCX. It also relies on UCC for +collectives. +''' toolchain = SYSTEM diff --git a/Golden_Repo/o/OpenMPI-settings/OpenMPI-settings-4.1-plain.eb b/Golden_Repo/o/OpenMPI-settings/OpenMPI-settings-4.1-UCX.eb similarity index 98% rename from Golden_Repo/o/OpenMPI-settings/OpenMPI-settings-4.1-plain.eb rename to Golden_Repo/o/OpenMPI-settings/OpenMPI-settings-4.1-UCX.eb index 976a72395c89a83290827e85437f145954e8460e..4688f919ac6e2a7bfc8687453fd740d65c70265c 100644 --- a/Golden_Repo/o/OpenMPI-settings/OpenMPI-settings-4.1-plain.eb +++ b/Golden_Repo/o/OpenMPI-settings/OpenMPI-settings-4.1-UCX.eb @@ -2,7 +2,7 @@ easyblock = 'SystemBundle' name = 'OpenMPI-settings' version = '4.1' -versionsuffix = 'plain' +versionsuffix = 'UCX' homepage = '' description = 'This module loads the default OpenMPI configuration. It relies on UCX.' 
diff --git a/Golden_Repo/p/psmpi-settings/psmpi-settings-5.6-plain.eb b/Golden_Repo/p/psmpi-settings/psmpi-settings-5.6-plain.eb deleted file mode 100644 index 7586f6ec33262e33ea88f23a5090608f6f4c2287..0000000000000000000000000000000000000000 --- a/Golden_Repo/p/psmpi-settings/psmpi-settings-5.6-plain.eb +++ /dev/null @@ -1,19 +0,0 @@ -easyblock = 'SystemBundle' - -name = 'psmpi-settings' -version = '5.6' -versionsuffix = 'plain' - -homepage = '' -description = 'This module loads the ParaStationMPI configuration. It relies on the defaults.' - -toolchain = SYSTEM - -source_urls = [] - -sources = [] -modextravars = { - 'PSP_HARD_ABORT': '1', -} - -moduleclass = 'system'