onnxruntime

mirror of https://github.com/saymrwulf/onnxruntime.git synced 2026-07-21 19:18:55 +00:00

History

Tianlei Wu 9e18b6a0f3 [CUDA] Update nvcc flags (#23572 ) ### Description (1) Remove `if (CMAKE_CUDA_COMPILER_VERSION VERSION_GREATER_EQUAL 11)` since the build requires CUDA >= 11.4. (2) Add sm_86 and sm_89 since we generate SASS code for the specified CUDA architectures only. This change adds support for popular consumer GPUs (like RTX 30X0 and RTX 40X0). (3) Add sm_120 to support Blackwell GPUs (like RTX 50X0 etc). (4) Add `-Xfatbin=-compress-all` to reduce wheel size. When CMAKE_CUDA_ARCHITECTURES is not specified, the size of the Linux wheel built with CUDA 12.8 is reduced by 8% (from 324MB to 299MB). ### Motivation and Context To support popular consumer GPUs (RTX 30x0, 40x0, 50x0) in the default setting. Reduce binary size. Note that the default sm settings do not impact the officially released binaries. The officially released ORT binaries are built with a build argument like CMAKE_CUDA_ARCHITECTURES=75;80;90, which produces both SASS (real) and PTX (virtual) code by default. See https://cmake.org/cmake/help/latest/prop_tgt/CUDA_ARCHITECTURES.html for more info.		2025-02-04 11:47:02 -08:00
..
external	remove log spam from cpuinfo (#23548 )	2025-01-31 18:16:24 -08:00
patches	remove log spam from cpuinfo (#23548 )	2025-01-31 18:16:24 -08:00
tensorboard
vcpkg-ports	Use latest vcpkg commit in configuration, sync manifest with deps.txt (#23554 )	2025-01-31 12:34:07 -08:00
vcpkg-triplets	Update the compile flags for vcpkg packages (#23455 )	2025-01-22 11:48:38 -08:00
adjust_global_compile_flags.cmake	Update ORT extension to the latest (#23314 )	2025-01-13 18:59:42 -08:00
arm64x.cmake	Dev/mookerem/arm64x update (#20536 )	2024-05-07 12:50:38 -07:00
CMakeLists.txt	[CUDA] Update nvcc flags (#23572 )	2025-02-04 11:47:02 -08:00
CMakePresets.json	Correct ONNX and Protobuf version in vcpkg build (#23285 )	2025-01-08 12:25:17 -08:00
CMakeSettings.json
codeconv.runsettings
deps.txt	[webgpu] Bump version of Dawn to b9b4a370 (#23494 )	2025-01-27 14:02:06 -08:00
deps_update_and_upload.py
EnableVisualStudioCodeAnalysis.props
gdk_toolchain.cmake
hip_fatbin_insert	[MIGraphX EP/ ROCm EP] add gfx1200, gfx1201 to CMAKE_HIP_ARCHITECTURES (#22348 )	2024-10-11 17:31:36 -07:00
Info.plist.in
libonnxruntime.pc.cmake.in
linux_arm32_crosscompile_toolchain.cmake
linux_arm64_crosscompile_toolchain.cmake
maccatalyst_prepare_objects_for_prelink.py
nuget_helpers.cmake	Update nuget.exe used in WindowsAI nuget packaging so `readme` property is supported. (#22141 )	2024-09-19 19:06:47 +10:00
onnxruntime.cmake	[QNN EP] Make QNN EP a shared library (#23120 )	2025-01-22 12:11:00 -08:00
onnxruntime_common.cmake	Enable QNN HTP support for Node (#20576 )	2024-05-09 13:11:07 -07:00
onnxruntime_compile_triton_kernel.cmake
onnxruntime_config.h.in	Pre-requisites of upgrading EMSDK (#23347 )	2025-01-14 11:07:21 -08:00
onnxruntime_csharp.cmake	Cleanup code (#22827 )	2024-11-19 14:13:33 -08:00
onnxruntime_flatbuffers.cmake
onnxruntime_framework.cmake	Adding CUDNN Frontend and use for CUDA NN Convolution (#19470 )	2024-08-02 15:16:42 -07:00
onnxruntime_framework.natvis
onnxruntime_fuzz_test.cmake	[Fuzzer] Add two new ORT libfuzzer (Linux clang support for now) (#22055 )	2024-09-12 11:50:34 -07:00
onnxruntime_graph.cmake
onnxruntime_ios.toolchain.cmake
onnxruntime_java.cmake	[QNN EP] Make QNN EP a shared library (#23120 )	2025-01-22 12:11:00 -08:00
onnxruntime_java_unittests.cmake	[Java] Add API for appending QNN EP (#22208 )	2024-10-01 10:18:04 -07:00
onnxruntime_kernel_explorer.cmake	[ROCm] prefer hip interfaces over roc during hipify (#22394 )	2024-10-14 20:34:03 -07:00
onnxruntime_lora.cmake	Multi-Lora support (#22046 )	2024-09-30 15:59:07 -07:00
onnxruntime_mlas.cmake	[ARM CPU] hgemm optimized for gqa (#23107 )	2025-01-24 15:25:24 -08:00
onnxruntime_nodejs.cmake	Fix delay load for WebGPU EP and DML EP (#23111 )	2024-12-19 10:23:48 -08:00
onnxruntime_objectivec.cmake	Initial WebGPU EP checkin (#22318 )	2024-10-08 16:10:46 -07:00
onnxruntime_opschema_lib.cmake
onnxruntime_optimizer.cmake	Update Linux docker images (#23244 )	2025-01-09 10:20:33 -08:00
onnxruntime_providers.cmake	[QNN EP] Make QNN EP a shared library (#23120 )	2025-01-22 12:11:00 -08:00
onnxruntime_providers_acl.cmake
onnxruntime_providers_armnn.cmake
onnxruntime_providers_azure.cmake
onnxruntime_providers_cann.cmake	Remove nsync (#20413 )	2024-10-21 15:32:14 -07:00
onnxruntime_providers_coreml.cmake	Enable coremltools for Linux build (#23481 )	2025-01-24 18:18:37 -08:00
onnxruntime_providers_cpu.cmake	Enable dlpack by default (#23110 )	2025-01-30 23:23:56 +01:00
onnxruntime_providers_cuda.cmake	Cleanup code (#22827 )	2024-11-19 14:13:33 -08:00
onnxruntime_providers_dml.cmake	Refactor the cmake code that is related to delay loading (#22646 )	2024-11-04 16:30:50 -08:00
onnxruntime_providers_dnnl.cmake	Remove nsync (#20413 )	2024-10-21 15:32:14 -07:00
onnxruntime_providers_js.cmake
onnxruntime_providers_migraphx.cmake	Remove nsync (#20413 )	2024-10-21 15:32:14 -07:00
onnxruntime_providers_nnapi.cmake
onnxruntime_providers_openvino.cmake	OVEP 1.21.0 Development Updates (#23080 )	2024-12-11 22:26:32 -08:00
onnxruntime_providers_qnn.cmake	[QNN EP] Make QNN EP a shared library (#23120 )	2025-01-22 12:11:00 -08:00
onnxruntime_providers_rknpu.cmake
onnxruntime_providers_rocm.cmake	Remove nsync (#20413 )	2024-10-21 15:32:14 -07:00
onnxruntime_providers_tensorrt.cmake	Remove nsync (#20413 )	2024-10-21 15:32:14 -07:00
onnxruntime_providers_vitisai.cmake	[VitisAI] Cache node subgraph when necessary (#22073 )	2024-11-08 23:17:16 -08:00
onnxruntime_providers_vsinpu.cmake	Remove nsync (#20413 )	2024-10-21 15:32:14 -07:00
onnxruntime_providers_webgpu.cmake	[WebGPU] allow build WebGPU EP for WebAssembly (#23364 )	2025-01-16 10:52:17 -08:00
onnxruntime_providers_webnn.cmake
onnxruntime_providers_xnnpack.cmake
onnxruntime_python.cmake	Enable dlpack by default (#23110 )	2025-01-30 23:23:56 +01:00
onnxruntime_rocm_hipify.cmake	[ROCm] redo hipify of version controlled files (#22449 )	2024-10-18 12:40:54 -07:00
onnxruntime_session.cmake	Multi-Lora support (#22046 )	2024-09-30 15:59:07 -07:00
onnxruntime_snpe_provider.cmake
onnxruntime_training.cmake	Multi-Lora support (#22046 )	2024-09-30 15:59:07 -07:00
onnxruntime_unittests.cmake	[QNN EP] Make QNN EP a shared library (#23120 )	2025-01-22 12:11:00 -08:00
onnxruntime_util.cmake
onnxruntime_visionos.toolchain.cmake
onnxruntime_webassembly.cmake	[WebGPU] allow build WebGPU EP for WebAssembly (#23364 )	2025-01-16 10:52:17 -08:00
precompiled_header.cmake
riscv64.toolchain.cmake
Sdl.ruleset
set_winapi_family_desktop.h
target_delayload.cmake	Refactor the cmake code that is related to delay loading (#22646 )	2024-11-04 16:30:50 -08:00
uwp_stubs.h
vcpkg-configuration.json	Use latest vcpkg commit in configuration, sync manifest with deps.txt (#23554 )	2025-01-31 12:34:07 -08:00
vcpkg.json	Use latest vcpkg commit in configuration, sync manifest with deps.txt (#23554 )	2025-01-31 12:34:07 -08:00
wcos_rules_override.cmake
winml.cmake	Fix a tiny problem in winml.cmake (#23173 )	2024-12-20 11:48:43 -08:00
winml_cppwinrt.cmake
winml_sdk_helpers.cmake
winml_unittests.cmake	Multi-Lora support (#22046 )	2024-09-30 15:59:07 -07:00