onnxruntime/tools/ci_build/github/azure-pipelines/orttraining-linux-gpu-on-device-training.yml
Adam Louly ee543a47f6
upgrade cuda version on ci pipelines (training CI pipelines) (#12708)
* upgrade cuda version on ci pipelines

* keeping folder name same

* keeping folder name same

* setting manual seed for primitive test case

* resolving comments

* changing atol and rtol only for test case

Co-authored-by: Adam Louly <adamlouly@microsoft.com@orttrainingdev7.d32nl1ml4oruzj4qz3bqlggovf.px.internal.cloudapp.net>
2022-08-26 16:51:19 -07:00

48 lines
1.5 KiB
YAML

# On-device training GPU pipeline.
#
# Builds ONNX Runtime inside a Docker image (CUDA 11.6, training and
# on-device training enabled, wheel built, tests skipped at build time) and
# then runs the on-device training tests in that image with all GPUs exposed.
#
# `trigger: none` disables CI triggers, so this pipeline does not start
# automatically on pushes.
trigger: none

jobs:
- job: Onnxruntime_Linux_GPU_OnDeviceTraining
  # Upper bound for the whole job, in minutes.
  timeoutInMinutes: 120
  pool: 'Onnxruntime-Linux-GPU-NC6sv3'

  steps:
  # Fresh checkout including all git submodules.
  - checkout: self
    clean: true
    submodules: recursive

  # Build step. The image is tagged `onnxruntime_ondevicetraining_tests_image`
  # (-t) so the test step below can run it by name.
  # NOTE(review): the quoted -x string is presumably forwarded to the build
  # script by the template -- confirm in templates/run-docker-build-steps.yml.
  # `--skip_tests` is passed here; the tests are launched by the next step.
  - template: templates/run-docker-build-steps.yml
    parameters:
      RunDockerBuildArgs: |
        -o ubuntu20.04 -d gpu -e \
        -t onnxruntime_ondevicetraining_tests_image \
        -x " \
          --config RelWithDebInfo \
          --enable_training \
          --enable_training_on_device \
          --use_cuda --cuda_version=11.6 --cuda_home=/usr/local/cuda-11.6 --cudnn_home=/usr/local/cuda-11.6 \
          --build_wheel \
          --skip_tests \
          " \
        -u
      DisplayName: 'Build onnxruntime'

  # Entry point for all on device training tests.
  # Mounts the source tree at /onnxruntime_src and the binaries directory at
  # /build, then runs launch_test.py from the RelWithDebInfo build output.
  # The final line of the command deliberately has no trailing backslash, so
  # lines appended to this script later are not absorbed as extra arguments.
  - script: |
      docker run \
        --gpus all \
        --shm-size=1024m \
        --rm \
        --volume $(Build.SourcesDirectory):/onnxruntime_src \
        --volume $(Build.BinariesDirectory):/build \
        onnxruntime_ondevicetraining_tests_image \
          /build/RelWithDebInfo/launch_test.py \
          --cwd /build/RelWithDebInfo --cmd_line_with_args "python orttraining_on_device_training_tests.py --cwd /build/RelWithDebInfo"
    displayName: 'Run On-Device Training Tests'
    # Runs even when an earlier step failed (but not when the run is canceled).
    # NOTE(review): if the build step failed the image may not exist -- confirm
    # this condition is intentional.
    condition: succeededOrFailed()
    timeoutInMinutes: 120

  - template: templates/component-governance-component-detection-steps.yml
    parameters:
      condition: 'succeeded'

  - template: templates/clean-agent-build-directory-step.yml