mirror of
https://github.com/saymrwulf/onnxruntime.git
synced 2026-06-30 03:37:44 +00:00
### Description This PR is to update the win-ort-main branch to the tip main branch as of 2025-01-23. ### PR List ddf0d377a7 [QNN EP] Add LoggingManager::HasDefaultLogger() to provider bridge API (#23467) 05fbbdf91f [QNN EP] Make QNN EP a shared library (#23120) 1336566d7f Add custom vcpkg ports (#23456) 2e1173c411 Update the compile flags for vcpkg packages (#23455) 1f628a9858 [Mobile] Add BrowserStack Android MAUI Test (#23383) 009cae0ec8 [js/webgpu] Optimize ConvTranspose (Continue) (#23429) 04a4a694cb Use onnx_protobuf.h to suppress some GCC warnings (#23453) 2e3b62b4b0 Suppress some strict-aliasing related warnings in WebGPU EP (#23454) b708f9b1dc Bump ruff from 0.9.1 to 0.9.2 (#23427) c0afc66b2a [WebNN] Remove workarounds for TFLite backend (#23406) 8a821ff7f9 Bump vite from 6.0.7 to 6.0.11 in /js/web/test/e2e/exports/testcases/vite-default (#23446) 220c1a203e Make ORT and Dawn use the same protobuf/abseil source code (#23447) b7b5792147 Change MacOS-13 to ubuntu on for android-java-api-aar-test.yml. (#23444) 19d0d2a30f WIP: Dp4MatMulNBits accuracy level 4 matmul for WebGPU EP (#23365) 95b8effbc4 [QNN EP]: Clean up QNN logging resources if an error occurs during initialization (#23435) 626134c5b5 Bump clang-format from 19.1.6 to 19.1.7 (#23428) 0cf975301f Fix eigen external deps (#23439) f9440aedce Moving RN_CI Android Testing to Linux (#23422) 1aa5902ff4 [QNN EP] workaround for QNN validation bug for Tanh with uint16 quantized output (#23432) 7f5582a0e2 Seperate RN andriod and IOS into 2 separated Stages. (#23400) 73deac2e7f Implement some missing element wise Add/Sub/Mul/Div/Neg operations for CPU and CUDA EPs (#23090) 949fe42af4 Upgrade Java version from react-native/android to Java 17 (#23066) 0892c23463 Update Qnn SDK default version to 2.30 (#23411) 94c099bcec Fix type cast build error (#23423) d633e571d1 [WebNN EP] Fix AddInitializersToSkip issues (#23354) e988ef00e2 [QNN EP] Fix regression for MatMul with two quantized/dynamic uint16 inputs (#23419) 7538795f6b Update onnxruntime binary size checks ci pipeline's docker image (#23405) 6c5ea41cad Revert "[QNN EP] Clean up correctly from a partial setup (#23320)" (#23420) e866804bbe Enable comprehension simplification in ruff rules (#23414) 0a5f1f392c bugfix: string_view of invalid memory (#23417) 4cc38e0277 fix crash when first input of BatchNormalization is 1-D (#23387) 033441487f Target py310 and modernize codebase with ruff (#23401) 87341ac010 [QNN EP] Fix segfault when unregistering HTP shared memory handles (#23402) ### Motivation and Context This update includes the change to make QNN-EP a shared library. --------- Signed-off-by: dependabot[bot] <support@github.com> Co-authored-by: Adrian Lizarraga <adlizarraga@microsoft.com> Co-authored-by: Justin Chu <justinchuby@users.noreply.github.com> Co-authored-by: Yulong Wang <7679871+fs-eire@users.noreply.github.com> Co-authored-by: Edward Chen <18449977+edgchen1@users.noreply.github.com> Co-authored-by: Changming Sun <chasun@microsoft.com> Co-authored-by: Peishen Yan <peishen.yan@intel.com> Co-authored-by: Tianlei Wu <tlwu@microsoft.com> Co-authored-by: Hector Li <hecli@microsoft.com> Co-authored-by: Jian Chen <cjian@microsoft.com> Co-authored-by: Alexis Tsogias <1114095+Zyrin@users.noreply.github.com> Co-authored-by: junchao-zhao <68935141+junchao-loongson@users.noreply.github.com> Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com> Co-authored-by: sushraja-msft <44513542+sushraja-msft@users.noreply.github.com> Co-authored-by: Wanming Lin <wanming.lin@intel.com> Co-authored-by: Jiajia Qin <jiajiaqin@microsoft.com> Co-authored-by: Caroline Zhu <wolfivyaura@gmail.com>
77 lines
3.1 KiB
Python
77 lines
3.1 KiB
Python
import argparse
|
|
import os
|
|
import sys
|
|
from concurrent.futures import ThreadPoolExecutor
|
|
from threading import Event, Thread # noqa: F401
|
|
|
|
from azureml._run_impl.run_watcher import RunWatcher
|
|
from azureml.core import Experiment, Run, Workspace # noqa: F401
|
|
from requests import Session
|
|
|
|
parser = argparse.ArgumentParser()
|
|
parser.add_argument(
|
|
"--subscription", type=str, default="ea482afa-3a32-437c-aa10-7de928a9e793"
|
|
) # AI Platform GPU - MLPerf
|
|
parser.add_argument(
|
|
"--resource_group", type=str, default="onnx_training", help="Azure resource group containing the AzureML Workspace"
|
|
)
|
|
parser.add_argument(
|
|
"--workspace", type=str, default="ort_training_dev", help="AzureML Workspace to run the Experiment in"
|
|
)
|
|
parser.add_argument("--experiment", type=str, default="BERT-ONNX", help="Name of the AzureML Experiment")
|
|
parser.add_argument("--run", type=str, default=None, help="The Experiment run to watch (defaults to the latest run)")
|
|
|
|
parser.add_argument("--remote_dir", type=str, default=None, help="Specify a remote directory to sync (read) from")
|
|
parser.add_argument("--local_dir", type=str, default=None, help="Specify a local directory to sync (write) to")
|
|
args = parser.parse_args()
|
|
|
|
# Validate
|
|
if (args.remote_dir and not args.local_dir) or (not args.remote_dir and args.local_dir):
|
|
print("Must specify both remote_dir and local_dir to sync files from Experiment")
|
|
sys.exit()
|
|
|
|
# Get the AzureML Workspace the Experiment is running in
|
|
ws = Workspace.get(name=args.workspace, subscription_id=args.subscription, resource_group=args.resource_group)
|
|
|
|
# Find the Experiment
|
|
experiment = Experiment(workspace=ws, name=args.experiment)
|
|
|
|
# Find the Run
|
|
runs = list(experiment.get_runs())
|
|
|
|
if len(runs) == 0:
|
|
print(f"No runs found in Experiment '{args.experiment}'")
|
|
sys.exit()
|
|
|
|
run = runs[0]
|
|
if args.run is not None:
|
|
try:
|
|
run = next(r for r in runs if r.id == args.run)
|
|
except StopIteration:
|
|
print(f"Run id '{args.run}' not found in Experiment '{args.experiment}'")
|
|
sys.exit()
|
|
|
|
# Optionally start synchronizing files from Run
|
|
if args.remote_dir and args.local_dir:
|
|
local_root = os.path.normpath(args.local_dir)
|
|
remote_root = args.remote_dir
|
|
|
|
if run.get_status() in ["Completed", "Failed", "Canceled"]:
|
|
print(f"Downloading Experiment files from remote directory: '{remote_root}' to local directory: '{local_root}'")
|
|
files = [f for f in run.get_file_names() if f.startswith(remote_root)]
|
|
for remote_path in files:
|
|
local_path = os.path.join(local_root, os.path.basename(remote_path))
|
|
run.download_file(remote_path, local_path)
|
|
else:
|
|
executor = ThreadPoolExecutor()
|
|
event = Event()
|
|
session = Session()
|
|
|
|
print(f"Streaming Experiment files from remote directory: '{remote_root}' to local directory: '{local_root}'")
|
|
watcher = RunWatcher(
|
|
run, local_root=local_root, remote_root=remote_root, executor=executor, event=event, session=session
|
|
)
|
|
executor.submit(watcher.refresh_requeue)
|
|
|
|
# Block until run completes, to keep updating the files (if streaming)
|
|
run.wait_for_completion(show_output=True)
|