mirror of
https://github.com/saymrwulf/onnxruntime.git
synced 2026-05-14 20:48:00 +00:00
### Description Previous image is based on cuda 12.1 and cudnn 8, which is out of date since we have moved to cudnn 9 since 1.19 release. (1) Upgrade base image to cuda 12.5.1 and cudnn 9. (2) Update CMAKE_CUDA_ARCHITECTURES from 52;60;61;70;75;86 to 61;70;75;80;86;90 to support A100 and H100 (3) Make the build faster: exclude unit test; use ninja etc. (4) upgrade some packages (like packaging etc) before building to avoid build error. ### Motivation and Context https://github.com/microsoft/onnxruntime/issues/21792 https://github.com/microsoft/onnxruntime/issues/21532
41 lines
1.9 KiB
Text
41 lines
1.9 KiB
Text
# --------------------------------------------------------------
|
|
# Copyright (c) Microsoft Corporation. All rights reserved.
|
|
# Licensed under the MIT License.
|
|
# --------------------------------------------------------------
|
|
# Build onnxruntime-gpu python package with CUDA 12.5 & CUDNN 9 for Nvidia GPU compute capability 6.1, 7.x, 8.x, 9.x.
|
|
# If memory is less than 64GB, you may change "--parallel" to "--parallel 4" to avoid out-of-memory error.
|
|
|
|
FROM nvcr.io/nvidia/cuda:12.5.1-cudnn-devel-ubuntu22.04
|
|
|
|
ARG CMAKE_CUDA_ARCHITECTURES=61;70;75;80;86;90
|
|
|
|
ENV DEBIAN_FRONTEND=noninteractive
|
|
MAINTAINER Changming Sun "chasun@microsoft.com"
|
|
ADD . /code
|
|
|
|
ENV PATH /usr/local/nvidia/bin:/usr/local/cuda/bin:${PATH}
|
|
RUN apt-get update \
|
|
&& apt-get install -y --no-install-recommends ca-certificates g++ gcc make git python3-dev python3-pip
|
|
|
|
RUN cd /code \
|
|
&& python3 -m pip install --upgrade pip cmake psutil setuptools wheel packaging ninja \
|
|
&& python3 -m pip install -r tools/ci_build/github/linux/docker/inference/x86_64/python/cpu/scripts/requirements.txt \
|
|
&& /bin/bash ./build.sh --allow_running_as_root --skip_submodule_sync \
|
|
--use_cuda --cuda_home /usr/local/cuda --cudnn_home /usr/lib/x86_64-linux-gnu/ \
|
|
--build_shared_lib --skip_tests \
|
|
--config Release --build_wheel --update --build --parallel \
|
|
--cmake_generator Ninja \
|
|
--enable_cuda_nhwc_ops \
|
|
--cmake_extra_defines ONNXRUNTIME_VERSION=$(cat ./VERSION_NUMBER) \
|
|
onnxruntime_BUILD_UNIT_TESTS=OFF \
|
|
`CMAKE_CUDA_ARCHITECTURES=${CMAKE_CUDA_ARCHITECTURES}`
|
|
|
|
FROM nvcr.io/nvidia/cuda:12.5.1-cudnn-runtime-ubuntu22.04
|
|
ENV DEBIAN_FRONTEND=noninteractive
|
|
COPY --from=0 /code/build/Linux/Release/dist /root
|
|
COPY --from=0 /code/dockerfiles/LICENSE-IMAGE.txt /code/LICENSE-IMAGE.txt
|
|
RUN apt-get update \
|
|
&& apt-get install -y --no-install-recommends libstdc++6 ca-certificates python3-setuptools python3-wheel python3-pip unattended-upgrades \
|
|
&& unattended-upgrade \
|
|
&& python3 -m pip install /root/*.whl \
|
|
&& rm -rf /root/*.whl
|