mirror of
https://github.com/saymrwulf/onnxruntime.git
synced 2026-06-04 23:59:56 +00:00
Implement CloudEP for hybrid inferencing.

The PR introduces no new API; customers can configure session and run options to run inference against an Azure [Triton endpoint](https://learn.microsoft.com/en-us/azure/machine-learning/how-to-deploy-with-triton?tabs=azure-cli%2Cendpoint).

A sample configuration in Python looks like this:

```
sess_opt.add_session_config_entry('cloud.endpoint_type', 'triton');
sess_opt.add_session_config_entry('cloud.uri', 'https://cloud.com');
sess_opt.add_session_config_entry('cloud.model_name', 'detection2');
sess_opt.add_session_config_entry('cloud.model_version', '7'); # optional, default 1
sess_opt.add_session_config_entry('cloud.verbose', '1'); # optional, default '0', meaning no verbose
...
run_opt.add_run_config_entry('use_cloud', '1') # 0 for local inferencing, 1 for cloud endpoint.
run_opt.add_run_config_entry('cloud.auth_key', '...')
...
sess.run(None, {'input':input_}, run_opt)
```

Co-authored-by: Randy Shuai <rashuai@microsoft.com>
69 lines
No EOL
1.8 KiB
YAML
69 lines
No EOL
1.8 KiB
YAML
# Pipeline parameters.
# Each enable_* flag is a boolean that defaults to true and is forwarded
# unchanged to templates/py-packaging-stage.yml by the `stages` section.
parameters:
# Linux CPU package.
- name: enable_linux_cpu
  displayName: 'Whether Linux CPU package is built.'
  type: boolean
  default: true

# Ubuntu CPU (manylinux_2_27) package.
- name: enable_ubuntu_cpu
  displayName: 'Whether Ubuntu CPU (manylinux_2_27) package is built.'
  type: boolean
  default: true

# Linux GPU package.
- name: enable_linux_gpu
  displayName: 'Whether Linux GPU package is built.'
  type: boolean
  default: true

# Windows CPU package.
- name: enable_windows_cpu
  displayName: 'Whether Windows CPU package is built.'
  type: boolean
  default: true

# Windows GPU package.
- name: enable_windows_gpu
  displayName: 'Whether Windows GPU package is built.'
  type: boolean
  default: true

# Mac CPU package.
- name: enable_mac_cpu
  displayName: 'Whether Mac CPU package is built.'
  type: boolean
  default: true

# Mac silicon package.
- name: enable_mac_silicon
  displayName: 'Whether Mac silicon package is built.'
  type: boolean
  default: true

# Linux ARM package.
- name: enable_linux_arm
  displayName: 'Whether Linux ARM package is built.'
  type: boolean
  default: true

# Extra build parameters as a free-form string. The literal 'NONE' is a
# sentinel: the `stages` section forwards this value to the template only
# when it differs from 'NONE'.
- name: build_py_parameters
  displayName: 'Specify extra build parameters'
  type: string
  default: 'NONE'

# CI (push) triggers are disabled for this pipeline.
# NOTE(review): runs are presumably queued manually or by a trigger defined
# outside this file — confirm.
trigger: none

# External repositories made available to the pipeline.
resources:
  repositories:
  # `manylinux` is the alias for the pypa/manylinux GitHub repository,
  # accessed through the service connection named `Microsoft`.
  - repository: manylinux
    type: Github
    endpoint: Microsoft
    name: pypa/manylinux
    # Pinned to a full commit SHA rather than a branch name.
    ref: 1a61614cabfd6b91c6afd6d9e172cc5b838c65fe

# All stages come from a single shared template; this file only forwards
# the pipeline parameters to it.
stages:
- template: templates/py-packaging-stage.yml
  parameters:
    enable_linux_gpu: ${{ parameters.enable_linux_gpu }}
    enable_ubuntu_cpu: ${{ parameters.enable_ubuntu_cpu }}
    enable_linux_cpu: ${{ parameters.enable_linux_cpu }}
    enable_windows_cpu: ${{ parameters.enable_windows_cpu }}
    enable_windows_gpu: ${{ parameters.enable_windows_gpu }}
    enable_mac_cpu: ${{ parameters.enable_mac_cpu }}
    enable_mac_silicon: ${{ parameters.enable_mac_silicon }}
    enable_linux_arm: ${{ parameters.enable_linux_arm }}
    # Conditional insertion: build_py_parameters is passed to the template
    # only when the caller replaced the 'NONE' sentinel; otherwise the key is
    # omitted and the template's own default (if any) applies.
    ${{ if not(eq(parameters.build_py_parameters, 'NONE')) }}:
      build_py_parameters: ${{ parameters.build_py_parameters }}