From 2bfe2c69b7ed4b226b8cb567df03c8077dcff0c4 Mon Sep 17 00:00:00 2001 From: Ashwini Khade Date: Thu, 21 Apr 2022 14:59:15 -0700 Subject: [PATCH] rocm pipeline fix for rel-1.11.1 (#11283) * fix rocm pipeline for 1.11.1 release * plus cosmetic changes --- ...orttraining-py-packaging-pipeline-rocm.yml | 39 +++++++++++++++---- 1 file changed, 32 insertions(+), 7 deletions(-) diff --git a/tools/ci_build/github/azure-pipelines/orttraining-py-packaging-pipeline-rocm.yml b/tools/ci_build/github/azure-pipelines/orttraining-py-packaging-pipeline-rocm.yml index 942c092e98..73ad7dda2a 100644 --- a/tools/ci_build/github/azure-pipelines/orttraining-py-packaging-pipeline-rocm.yml +++ b/tools/ci_build/github/azure-pipelines/orttraining-py-packaging-pipeline-rocm.yml @@ -10,12 +10,25 @@ stages: clean: all pool: AMD-GPU steps: - - template: templates/ get-docker-image-steps.yml + - template: templates/get-docker-image-steps.yml + parameters: + Dockerfile: tools/ci_build/github/linux/docker/Dockerfile.manylinux2014_rocm4_2 + Context: tools/ci_build/github/linux/docker + DockerBuildArgs: >- + --build-arg TORCH_VERSION=1.10.0 + --build-arg INSTALL_DEPS_EXTRA_ARGS=-tmur + --build-arg BUILD_UID=$(id -u) + --network=host --build-arg POLICY=manylinux2014 --build-arg PLATFORM=x86_64 + --build-arg DEVTOOLSET_ROOTPATH=/opt/rh/devtoolset-10/root + --build-arg PREPEND_PATH=/opt/rh/devtoolset-10/root/usr/bin: + --build-arg LD_LIBRARY_PATH_ARG=/opt/rh/devtoolset-10/root/usr/lib64:/opt/rh/devtoolset-10/root/usr/lib:/opt/rh/devtoolset-10/root/usr/lib64/dyninst:/opt/rh/devtoolset-10/root/usr/lib/dyninst:/usr/local/lib64:/usr/local/lib + Repository: onnxruntimetrainingrocmbuild-torch1.10.0-rocm4.2 + - template: templates/get-docker-image-steps.yml parameters: Dockerfile: tools/ci_build/github/linux/docker/Dockerfile.manylinux2014_rocm4_3_1 Context: tools/ci_build/github/linux/docker DockerBuildArgs: >- - --build-arg TORCH_VERSION=1.11.0 + --build-arg TORCH_VERSION=1.10.0 --build-arg INSTALL_DEPS_EXTRA_ARGS=-tmur --build-arg BUILD_UID=$(id -u) --network=host --build-arg POLICY=manylinux2014 --build-arg PLATFORM=x86_64 @@ -23,12 +36,12 @@ stages: --build-arg PREPEND_PATH=/opt/rh/devtoolset-10/root/usr/bin: --build-arg LD_LIBRARY_PATH_ARG=/opt/rh/devtoolset-10/root/usr/lib64:/opt/rh/devtoolset-10/root/usr/lib:/opt/rh/devtoolset-10/root/usr/lib64/dyninst:/opt/rh/devtoolset-10/root/usr/lib/dyninst:/usr/local/lib64:/usr/local/lib Repository: onnxruntimetrainingrocmbuild-torch1.10.0-rocm4.3.1 - - template: templates/ get-docker-image-steps.yml + - template: templates/get-docker-image-steps.yml parameters: Dockerfile: tools/ci_build/github/linux/docker/Dockerfile.manylinux2014_rocm5_0_1 Context: tools/ci_build/github/linux/docker DockerBuildArgs: >- - --build-arg TORCH_VERSION=1.11.0 + --build-arg TORCH_VERSION=1.10.0 --build-arg INSTALL_DEPS_EXTRA_ARGS=-tmur --build-arg BUILD_UID=$(id -u) --network=host --build-arg POLICY=manylinux2014 --build-arg PLATFORM=x86_64 @@ -47,6 +60,18 @@ stages: - ROCm_build_environment strategy: matrix: + Python37 Torch1100 Rocm42: + PythonVersion: '3.7' + TorchVersion: '1.10.0' + RocmVersion: '4.2' + Python38 Torch1100 Rocm42: + PythonVersion: '3.8' + TorchVersion: '1.10.0' + RocmVersion: '4.2' + Python39 Torch1100 Rocm42: + PythonVersion: '3.9' + TorchVersion: '1.10.0' + RocmVersion: '4.2' Python37 Torch1100 Rocm431: PythonVersion: '3.7' TorchVersion: '1.10.0' @@ -77,7 +102,7 @@ stages: clean: true submodules: recursive - - template: templates/ set-python-manylinux-variables-step.yml + - template: templates/set-python-manylinux-variables-step.yml - task: CmdLine@2 inputs: @@ -297,8 +322,8 @@ stages: condition: and(succeeded(), eq(variables['DRY_RUN'], '0')) displayName: 'Upload Rocm wheel to release repository' - - template: templates/ component-governance-component-detection-steps.yml + - template: templates/component-governance-component-detection-steps.yml parameters: condition: 'succeeded' - - template: templates/ clean-agent-build-directory-step.yml + - template: templates/clean-agent-build-directory-step.yml