File tree Expand file tree Collapse file tree 1 file changed +0
-21
lines changed Expand file tree Collapse file tree 1 file changed +0
-21
lines changed Original file line number Diff line number Diff line change 84 84 end
85 85 end
86 86
87- local function eessi_openmpi_load_hook(t)
88- -- disable smcuda BTL when loading OpenMPI module for aarch64/neoverse_v1,
89- -- to work around hang/crash due to bug in OpenMPI;
90- -- see https://gitlab.com/eessi/support/-/issues/41
91- local frameStk = require("FrameStk"):singleton()
92- local mt = frameStk:mt()
93- local moduleName = string.match(t.modFullName, "(.-)/")
94- local cpuTarget = os.getenv("EESSI_SOFTWARE_SUBDIR") or ""
95- if (moduleName == "OpenMPI") and (cpuTarget == "aarch64/neoverse_v1") then
96- local msg = "Adding '^smcuda' to $OMPI_MCA_btl to work around bug in OpenMPI"
97- LmodMessage(msg .. " (see https://gitlab.com/eessi/support/-/issues/41)")
98- local ompiMcaBtl = os.getenv("OMPI_MCA_btl")
99- if ompiMcaBtl == nil then
100- setenv("OMPI_MCA_btl", "^smcuda")
101- else
102- setenv("OMPI_MCA_btl", ompiMcaBtl .. ",^smcuda")
103- end
104- end
105- end
106-
107 87 -- Combine both functions into a single one, as we can only register one function as load hook in lmod
108 88 -- Also: make it non-local, so it can be imported and extended by other lmodrc files if needed
109 89 function eessi_load_hook(t)
110 90 eessi_cuda_enabled_load_hook(t)
111- eessi_openmpi_load_hook(t)
112 91 end
113 92
114 93
You can’t perform that action at this time.
0 commit comments