33# Based on https://github.com/amd/InfinityHub-CI/tree/main/base-gpu-mpi-rocm-docker
44##############################################################
55
# ROCm release; interpolated into the base-image tag of the FROM instruction below.
6- ARG ROCM_VERSION=5.5.1
6+ ARG ROCM_VERSION=6.3.2
77
# Base stage: ROCm development image whose tag is selected by ROCM_VERSION.
# `AS` is uppercase to match the casing of the FROM keyword.
88FROM rocm/dev-ubuntu-22.04:${ROCM_VERSION}-complete AS sdk-base
99
# Versions of UCX and Open MPI to build (presumably used as git refs by the
# build steps further down - not visible in this view; confirm).
# The values must not contain whitespace.
10- ARG UCX_BRANCH="v1.13.1"
11- ARG OMPI_BRANCH="v4.1.4"
10+ ARG UCX_BRANCH="v1.14.1"
11+ ARG OMPI_BRANCH="v5.0.6"
1212
1313# Update and Install basic Linux development tools
1414RUN rm /etc/apt/sources.list.d/* \
@@ -46,7 +46,7 @@ ENV ROCM_HOME=/opt/rocm \
4646 OMPI_HOME=/opt/ompi
4747
4848# Until rocm base has it fixed: expose offload-arch under /opt/rocm/bin.
# `||` (not a pipe) so the notice is printed only when ln fails, typically
# because the link already exists; the build continues either way.
49- RUN ln -s /opt/rocm/llvm/bin/offload-arch /opt/rocm/bin/offload-arch
49+ RUN ln -s /opt/rocm/llvm/bin/offload-arch /opt/rocm/bin/offload-arch || echo "offload-arch already exists"
5050
5151# Install tmpi
# -f makes curl fail on an HTTP error instead of saving the error page as the
# script; -sS hides the progress meter but keeps error messages; -L follows
# redirects.
5252RUN curl -fsSL https://raw.githubusercontent.com/Azrael3000/tmpi/master/tmpi -o /usr/local/bin/tmpi
@@ -73,10 +73,14 @@ RUN cd /tmp/ \
7373 --without-knem \
7474 --without-xpmem \
7575 --without-cuda \
76+ --without-java \
77+ --enable-mt \
7678 --enable-optimizations \
7779 --disable-logging \
7880 --disable-debug \
7981 --disable-examples \
82+ --disable-assertions \
83+ --disable-params-check \
8084 && make -j ${nproc} \
8185 && make install
8286
@@ -87,17 +91,22 @@ RUN cd /tmp \
8791 && ./autogen.pl \
8892 && mkdir build \
8993 && cd build \
90- && ../configure --prefix=$OMPI_HOME --with-ucx=$UCX_HOME \
91- CC=amdclang CXX=amdclang++ FC=amdflang F90=amdflang \
92- --enable-mca-no-build=btl-uct \
94+ && ../configure CC=amdclang CXX=amdclang++ FC=amdflang F90=amdflang \
95+ --prefix=$OMPI_HOME \
96+ --with-ucx=$UCX_HOME \
97+ --with-rocm=$ROCM_HOME \
98+ --enable-mca-no-build=btl-uct \
9399 --without-verbs \
94- --with-pmix \
95- --enable-mpi \
96- --enable-mpi-fortran=yes \
100+ --enable-mpi1-compatibility \
101+ --enable-mpi-fortran=no \
97102 --disable-debug \
98103 && make -j ${nproc} \
99104 && make install
100105
106+ # UCX runtime settings, declared together in a single ENV instruction
107+ ENV UCX_WARN_UNUSED_ENV_VARS=n \
108+     UCX_TLS=sm,self,rocm,rocm_copy,rocm_ipc
109+
101110# Cleanup: remove /tmp/ucx and /tmp/ompi (presumably the source/build trees).
# NOTE(review): deleting in a separate RUN does not shrink the layers that
# created these directories; consider removing them in the RUN that builds them.
102111RUN rm -rf /tmp/ucx /tmp/ompi
103112
0 commit comments