mirror of
https://github.com/saymrwulf/onnxruntime.git
synced 2026-06-18 01:54:05 +00:00
### Description This PR is to update the win-ort-main branch to the tip main branch as of 2025-01-16. ### Motivation and Context This update includes the OpenVino fix for debug builds. --------- Signed-off-by: Liqun Fu <liqfu@microsoft.com> Signed-off-by: Liqun Fu <liqun.fu@microsoft.com> Signed-off-by: Junze Wu <junze.wu@intel.com> Signed-off-by: dependabot[bot] <support@github.com> Signed-off-by: Jianhui Dai <jianhui.j.dai@intel.com> Co-authored-by: Yueqing Zhang <yuz75@Pitt.edu> Co-authored-by: amancini-N <63410090+amancini-N@users.noreply.github.com> Co-authored-by: Adrian Lizarraga <adlizarraga@microsoft.com> Co-authored-by: liqun Fu <liqfu@microsoft.com> Co-authored-by: Guenther Schmuelling <guschmue@microsoft.com> Co-authored-by: Yifan Li <109183385+yf711@users.noreply.github.com> Co-authored-by: yf711 <yifanl@microsoft.com> Co-authored-by: Wanming Lin <wanming.lin@intel.com> Co-authored-by: wejoncy <wejoncy@163.com> Co-authored-by: wejoncy <wejoncy@.com> Co-authored-by: Scott McKay <skottmckay@gmail.com> Co-authored-by: Changming Sun <chasun@microsoft.com> Co-authored-by: Jean-Michaël Celerier <jeanmichael.celerier+github@gmail.com> Co-authored-by: Dmitry Deshevoy <mityada@gmail.com> Co-authored-by: xhcao <xinghua.cao@intel.com> Co-authored-by: Yueqing Zhang <yueqingz@amd.com> Co-authored-by: Yulong Wang <7679871+fs-eire@users.noreply.github.com> Co-authored-by: Jiajia Qin <jiajiaqin@microsoft.com> Co-authored-by: Wu, Junze <junze.wu@intel.com> Co-authored-by: Jian Chen <cjian@microsoft.com> Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> Co-authored-by: Matthieu Darbois <mayeut@users.noreply.github.com> Co-authored-by: Prathik Rao <prathik.rao@gmail.com> Co-authored-by: wonchung-microsoft <wonchung@microsoft.com> Co-authored-by: Vincent Wang <wangwchpku@outlook.com> Co-authored-by: PARK DongHa <luncliff@gmail.com> Co-authored-by: Hector Li <hecli@microsoft.com> Co-authored-by: Sam Webster 
<13457618+samwebster@users.noreply.github.com> Co-authored-by: Adrian Lizarraga <adrianlm2@gmail.com> Co-authored-by: Preetha Veeramalai <preetha.veeramalai@intel.com> Co-authored-by: jatinwadhwa921 <jatin.wadhwa@intel.com> Co-authored-by: Satya Kumar Jandhyala <satya.k.jandhyala@gmail.com> Co-authored-by: Corentin Maravat <101636442+cocotdf@users.noreply.github.com> Co-authored-by: Xiaoyu <85524621+xiaoyu-work@users.noreply.github.com> Co-authored-by: Tianlei Wu <tlwu@microsoft.com> Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com> Co-authored-by: Jie Chen <jie.a.chen@intel.com> Co-authored-by: Jianhui Dai <jianhui.j.dai@intel.com> Co-authored-by: Copilot <175728472+Copilot@users.noreply.github.com> Co-authored-by: Edward Chen <18449977+edgchen1@users.noreply.github.com> Co-authored-by: Baiju Meswani <bmeswani@microsoft.com> Co-authored-by: kunal-vaishnavi <115581922+kunal-vaishnavi@users.noreply.github.com> Co-authored-by: Justin Chu <justinchuby@users.noreply.github.com> Co-authored-by: Copilot Autofix powered by AI <62310815+github-advanced-security[bot]@users.noreply.github.com> Co-authored-by: Ted Themistokleous <107195283+TedThemistokleous@users.noreply.github.com> Co-authored-by: Jeff Daily <jeff.daily@amd.com> Co-authored-by: Artur Wojcik <artur.wojcik@outlook.com> Co-authored-by: Ted Themistokleous <tedthemistokleous@amd.com> Co-authored-by: Xinya Zhang <Xinya.Zhang@amd.com> Co-authored-by: ikalinic <ilija.kalinic@amd.com> Co-authored-by: sstamenk <sstamenk@amd.com> Co-authored-by: Yi-Hong Lyu <yilyu@microsoft.com> Co-authored-by: Ti-Tai Wang <titaiwang@microsoft.com>
112 lines
4.1 KiB
Text
112 lines
4.1 KiB
Text
# --------------------------------------------------------------
|
|
# Copyright (c) Microsoft Corporation. All rights reserved.
|
|
# Licensed under the MIT License.
|
|
# --------------------------------------------------------------
|
|
# Build onnxruntime-gpu python package with CUDA 12.x & CUDNN 9.x for python 3.12 in Ubuntu 24.04.
|
|
# If memory is less than 64GB, you may change "--parallel" to "--parallel 4" to avoid out-of-memory error.
|
|
|
|
# Versions that select the CUDA base image tags and the cuDNN release.
# They are declared before the first FROM so that FROM lines can reference them.
ARG CUDA_VERSION=12.6.1
ARG CUDNN_VERSION=9.5.0.50
ARG OS=ubuntu24.04

# Build stage: CUDA "devel" image used to compile ONNX Runtime.
# The stage is named, but it is still addressable by its index (0).
FROM nvcr.io/nvidia/cuda:${CUDA_VERSION}-devel-${OS} AS build

# An ARG declared before FROM is only visible to FROM lines; re-declare the ones
# this stage's RUN instructions need (they keep the defaults given above).
ARG CUDA_VERSION
ARG CUDNN_VERSION

# Adjust as needed
# Check your CUDA arch: https://developer.nvidia.com/cuda-gpus
ARG CMAKE_CUDA_ARCHITECTURES="75;80;90"

ENV DEBIAN_FRONTEND=noninteractive

# Copy source code to /code.
# COPY is used instead of ADD because this is a plain local copy: no archive
# extraction or remote fetch is wanted here.
COPY . /code

ENV PATH=/usr/local/cuda/bin:${PATH}
|
|
|
|
# Install the compiler toolchain, build tools and Python packages used by the build.
# The apt package index is removed in the same layer so it is not kept in the image.
RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        ca-certificates \
        cmake \
        g++ \
        gcc \
        git \
        make \
        ninja-build \
        python3-pip \
        python3.12-dev \
        python3.12-venv \
        wget \
    && rm -rf /var/lib/apt/lists/*
|
|
|
|
# Install cuDNN (version taken from the CUDNN_VERSION build argument) for building
# ONNX Runtime with CUDA. The archive is unpacked into /code/build/cudnn and the
# downloaded tarball is removed in the same layer.
# ${CUDA_VERSION%%.*} drops everything from the first dot onward, leaving the CUDA
# major version that appears in the archive file name.
RUN cudnn_tar="cudnn-linux-x86_64-${CUDNN_VERSION}_cuda${CUDA_VERSION%%.*}-archive.tar.xz" \
    && wget "https://developer.download.nvidia.com/compute/cudnn/redist/cudnn/linux-x86_64/${cudnn_tar}" \
    && mkdir -p /code/build/cudnn \
    && tar -Jxvf "${cudnn_tar}" -C /code/build/cudnn --strip-components=1 \
    && rm -f "${cudnn_tar}"
|
|
|
|
# Create a virtual environment and install dependencies, then build ONNX Runtime with CUDA support.
# WORKDIR replaces the former `cd /code`; the relative ./VERSION_NUMBER path below
# is resolved against it.
WORKDIR /code
RUN python3 -m venv /code/env \
    && . /code/env/bin/activate \
    && pip install --upgrade psutil setuptools wheel packaging \
    && pip install -r /code/tools/ci_build/github/linux/python/requirements.txt \
    && python /code/tools/ci_build/build.py --build_dir /code/build/Linux \
        --allow_running_as_root --skip_submodule_sync \
        --use_cuda --cuda_home /usr/local/cuda \
        --cudnn_home /code/build/cudnn \
        --build_shared_lib --skip_tests \
        --config Release --build_wheel --update --build --parallel \
        --cmake_generator Ninja \
        --cmake_extra_defines \
            "ONNXRUNTIME_VERSION=$(cat ./VERSION_NUMBER)" \
            "CMAKE_CUDA_ARCHITECTURES=${CMAKE_CUDA_ARCHITECTURES}" \
            onnxruntime_BUILD_UNIT_TESTS=OFF
|
|
|
|
# Start second stage to copy the build artifacts
FROM nvcr.io/nvidia/cuda:${CUDA_VERSION}-runtime-${OS}

# Re-declare the version arguments so they are visible inside this stage.
ARG CUDA_VERSION
ARG CUDNN_VERSION

# These have no default value and must be supplied with --build-arg.
ARG GIT_COMMIT
ARG GIT_BRANCH
ARG ONNXRUNTIME_VERSION

# Make sure the required build arguments are set. See README.md for more information.
# ${VAR:?message} makes the shell fail with the message when VAR is unset or empty.
# The expansions are quoted so a value containing whitespace cannot break `test`.
RUN test -n "${GIT_COMMIT:?GIT_COMMIT build argument is required}" \
    && test -n "${GIT_BRANCH:?GIT_BRANCH build argument is required}" \
    && test -n "${ONNXRUNTIME_VERSION:?ONNXRUNTIME_VERSION build argument is required}"
|
|
|
|
# Image metadata: CUDA/cuDNN versions, maintainer, and the ONNX Runtime version,
# branch and commit passed in as build arguments.
LABEL CUDA_VERSION="${CUDA_VERSION}" \
      CUDNN_VERSION="${CUDNN_VERSION}" \
      maintainer="Changming Sun <chasun@microsoft.com>" \
      onnxruntime_version="${ONNXRUNTIME_VERSION}" \
      onnxruntime_git_branch="${GIT_BRANCH}" \
      onnxruntime_git_commit="${GIT_COMMIT}"
|
|
|
|
# Bring the wheel output directory and the image license over from the first stage (index 0).
COPY --from=0 /code/build/Linux/Release/dist /ort
COPY --from=0 /code/dockerfiles/LICENSE-IMAGE.txt /code/LICENSE-IMAGE.txt

# Runtime environment variables.
# LD_LIBRARY_PATH: CUDNN from the nvidia-cudnn-cu12 python package is located in the
# site-packages directory of the python virtual environment.
ENV DEBIAN_FRONTEND=noninteractive \
    CUDNN_VERSION=$CUDNN_VERSION \
    ONNXRUNTIME_VERSION=$ONNXRUNTIME_VERSION \
    LD_LIBRARY_PATH="/ort/env/lib/python3.12/site-packages/nvidia/cudnn/lib:/usr/local/cuda/lib64"
|
|
|
|
# Install runtime dependencies, create the /ort/env virtual environment, and install
# the copied ONNX Runtime wheel together with the matching cuDNN pip package into it.
# --no-cache-dir keeps pip's download cache out of this image layer.
# The final import prints the available execution providers and fails the build
# if the installed wheel cannot be imported.
RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        ca-certificates \
        libstdc++6 \
        python3-pip \
        python3.12-venv \
    && python3 -m venv /ort/env \
    && . /ort/env/bin/activate \
    && pip install --no-cache-dir /ort/*.whl \
    && pip install --no-cache-dir "nvidia-cudnn-cu${CUDA_VERSION%%.*}==${CUDNN_VERSION}" \
    && python -c 'import onnxruntime; print(onnxruntime.get_available_providers())' \
    && rm -rf /ort/*.whl \
    && rm -rf /var/lib/apt/lists/*
|
|
|
|
# Ensure the virtual environment is used when running commands in the container.
# ~/.bashrc is only read by interactive bash shells, so on its own it does not cover
# non-interactive use such as `docker run <image> python script.py`. Putting the
# environment's bin directory first on PATH makes its python and pip the default everywhere.
ENV VIRTUAL_ENV=/ort/env \
    PATH=/ort/env/bin:${PATH}

# Also source the activate script in interactive bash shells.
RUN echo ". /ort/env/bin/activate" >> ~/.bashrc

# Set the default command to start an interactive bash shell
CMD [ "/bin/bash" ]
|