From 3e879aab6bf5f6e902151e9d14c4fe76f6792e1f Mon Sep 17 00:00:00 2001
From: Jeff Daily
Date: Thu, 14 Oct 2021 09:49:31 -0700
Subject: [PATCH] work around ucx in rocm ci Dockerfile (#9360)

---
Note: line breaks were reconstructed from a copy of this patch that had been
collapsed onto a single line. The indentation of the continuation lines in the
hunk below is approximate; if the context does not match, apply with
`git apply --ignore-whitespace`.

 tools/ci_build/github/pai/rocm-ci-pipeline-env.Dockerfile | 7 +++++++
 1 file changed, 7 insertions(+)

diff --git a/tools/ci_build/github/pai/rocm-ci-pipeline-env.Dockerfile b/tools/ci_build/github/pai/rocm-ci-pipeline-env.Dockerfile
index aac42add29..2c9d9c6f05 100644
--- a/tools/ci_build/github/pai/rocm-ci-pipeline-env.Dockerfile
+++ b/tools/ci_build/github/pai/rocm-ci-pipeline-env.Dockerfile
@@ -2,6 +2,13 @@ FROM rocm/pytorch:rocm4.3.1_ubuntu18.04_py3.6_pytorch_1.9.0
 
 WORKDIR /stage
 
+# from rocm/pytorch's image, work around ucx's dlopen replacement conflicting with shared provider
+RUN cd /opt/mpi_install/ucx/build &&\
+    make clean &&\
+    ../contrib/configure-release --prefix=/opt/ucx --without-rocm &&\
+    make -j $(nproc) &&\
+    make install
+
 # rocm-ci branch contains instrumentation needed for loss curves and perf
 RUN git clone https://github.com/microsoft/huggingface-transformers.git &&\
     cd huggingface-transformers &&\