mirror of
https://github.com/saymrwulf/onnxruntime.git
synced 2026-06-30 03:37:44 +00:00
### Description This PR is to update the win-ort-main branch to the tip main branch as of 2025-01-16. ### Motivation and Context This update includes the OpenVino fix for debug builds. --------- Signed-off-by: Liqun Fu <liqfu@microsoft.com> Signed-off-by: Liqun Fu <liqun.fu@microsoft.com> Signed-off-by: Junze Wu <junze.wu@intel.com> Signed-off-by: dependabot[bot] <support@github.com> Signed-off-by: Jianhui Dai <jianhui.j.dai@intel.com> Co-authored-by: Yueqing Zhang <yuz75@Pitt.edu> Co-authored-by: amancini-N <63410090+amancini-N@users.noreply.github.com> Co-authored-by: Adrian Lizarraga <adlizarraga@microsoft.com> Co-authored-by: liqun Fu <liqfu@microsoft.com> Co-authored-by: Guenther Schmuelling <guschmue@microsoft.com> Co-authored-by: Yifan Li <109183385+yf711@users.noreply.github.com> Co-authored-by: yf711 <yifanl@microsoft.com> Co-authored-by: Wanming Lin <wanming.lin@intel.com> Co-authored-by: wejoncy <wejoncy@163.com> Co-authored-by: wejoncy <wejoncy@.com> Co-authored-by: Scott McKay <skottmckay@gmail.com> Co-authored-by: Changming Sun <chasun@microsoft.com> Co-authored-by: Jean-Michaël Celerier <jeanmichael.celerier+github@gmail.com> Co-authored-by: Dmitry Deshevoy <mityada@gmail.com> Co-authored-by: xhcao <xinghua.cao@intel.com> Co-authored-by: Yueqing Zhang <yueqingz@amd.com> Co-authored-by: Yulong Wang <7679871+fs-eire@users.noreply.github.com> Co-authored-by: Jiajia Qin <jiajiaqin@microsoft.com> Co-authored-by: Wu, Junze <junze.wu@intel.com> Co-authored-by: Jian Chen <cjian@microsoft.com> Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> Co-authored-by: Matthieu Darbois <mayeut@users.noreply.github.com> Co-authored-by: Prathik Rao <prathik.rao@gmail.com> Co-authored-by: wonchung-microsoft <wonchung@microsoft.com> Co-authored-by: Vincent Wang <wangwchpku@outlook.com> Co-authored-by: PARK DongHa <luncliff@gmail.com> Co-authored-by: Hector Li <hecli@microsoft.com> Co-authored-by: Sam Webster <13457618+samwebster@users.noreply.github.com> Co-authored-by: Adrian Lizarraga <adrianlm2@gmail.com> Co-authored-by: Preetha Veeramalai <preetha.veeramalai@intel.com> Co-authored-by: jatinwadhwa921 <jatin.wadhwa@intel.com> Co-authored-by: Satya Kumar Jandhyala <satya.k.jandhyala@gmail.com> Co-authored-by: Corentin Maravat <101636442+cocotdf@users.noreply.github.com> Co-authored-by: Xiaoyu <85524621+xiaoyu-work@users.noreply.github.com> Co-authored-by: Tianlei Wu <tlwu@microsoft.com> Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com> Co-authored-by: Jie Chen <jie.a.chen@intel.com> Co-authored-by: Jianhui Dai <jianhui.j.dai@intel.com> Co-authored-by: Copilot <175728472+Copilot@users.noreply.github.com> Co-authored-by: Edward Chen <18449977+edgchen1@users.noreply.github.com> Co-authored-by: Baiju Meswani <bmeswani@microsoft.com> Co-authored-by: kunal-vaishnavi <115581922+kunal-vaishnavi@users.noreply.github.com> Co-authored-by: Justin Chu <justinchuby@users.noreply.github.com> Co-authored-by: Copilot Autofix powered by AI <62310815+github-advanced-security[bot]@users.noreply.github.com> Co-authored-by: Ted Themistokleous <107195283+TedThemistokleous@users.noreply.github.com> Co-authored-by: Jeff Daily <jeff.daily@amd.com> Co-authored-by: Artur Wojcik <artur.wojcik@outlook.com> Co-authored-by: Ted Themistokleous <tedthemistokleous@amd.com> Co-authored-by: Xinya Zhang <Xinya.Zhang@amd.com> Co-authored-by: ikalinic <ilija.kalinic@amd.com> Co-authored-by: sstamenk <sstamenk@amd.com> Co-authored-by: Yi-Hong Lyu <yilyu@microsoft.com> Co-authored-by: Ti-Tai Wang <titaiwang@microsoft.com>
95 lines
3.7 KiB
TypeScript
95 lines
3.7 KiB
TypeScript
// Copyright (c) Microsoft Corporation. All rights reserved.
|
|
// Licensed under the MIT License.
|
|
|
|
import { Backend, env, InferenceSession, InferenceSessionHandler } from 'onnxruntime-common';
|
|
|
|
import { initializeOrtEp, initializeWebAssemblyAndOrtRuntime } from './wasm/proxy-wrapper';
|
|
import { OnnxruntimeWebAssemblySessionHandler } from './wasm/session-handler-inference';
|
|
|
|
/**
|
|
* This function initializes all flags for WebAssembly.
|
|
*
|
|
* Those flags are accessible from `ort.env.wasm`. Users are allow to set those flags before the first inference session
|
|
* being created, to override default value.
|
|
*/
|
|
export const initializeFlags = (): void => {
|
|
if (typeof env.wasm.initTimeout !== 'number' || env.wasm.initTimeout < 0) {
|
|
env.wasm.initTimeout = 0;
|
|
}
|
|
|
|
if (env.wasm.simd === false) {
|
|
// eslint-disable-next-line no-console
|
|
console.warn(
|
|
'Deprecated property "env.wasm.simd" is set to false. ' +
|
|
'non-SIMD build is no longer provided, and this setting will be ignored.',
|
|
);
|
|
}
|
|
|
|
if (typeof env.wasm.proxy !== 'boolean') {
|
|
env.wasm.proxy = false;
|
|
}
|
|
|
|
if (typeof env.wasm.trace !== 'boolean') {
|
|
env.wasm.trace = false;
|
|
}
|
|
|
|
if (typeof env.wasm.numThreads !== 'number' || !Number.isInteger(env.wasm.numThreads) || env.wasm.numThreads <= 0) {
|
|
// The following logic only applies when `ort.env.wasm.numThreads` is not set by user. We will always honor user's
|
|
// setting if it is provided.
|
|
|
|
// Browser: when crossOriginIsolated is false, SharedArrayBuffer is not available so WebAssembly threads will not
|
|
// work. In this case, we will set numThreads to 1.
|
|
//
|
|
// There is an exception: when the browser is configured to force-enable SharedArrayBuffer (e.g. Chromuim with
|
|
// --enable-features=SharedArrayBuffer), it is possible that `self.crossOriginIsolated` is false and
|
|
// SharedArrayBuffer is available at the same time. This is usually for testing. In this case, we will still set
|
|
// numThreads to 1 here. If we want to enable multi-threading in test, we should set `ort.env.wasm.numThreads` to a
|
|
// value greater than 1.
|
|
if (typeof self !== 'undefined' && !self.crossOriginIsolated) {
|
|
env.wasm.numThreads = 1;
|
|
} else {
|
|
const numCpuLogicalCores =
|
|
typeof navigator === 'undefined' ? require('node:os').cpus().length : navigator.hardwareConcurrency;
|
|
env.wasm.numThreads = Math.min(4, Math.ceil((numCpuLogicalCores || 1) / 2));
|
|
}
|
|
}
|
|
};
|
|
|
|
export class OnnxruntimeWebAssemblyBackend implements Backend {
|
|
/**
|
|
* This function initializes the WebAssembly backend.
|
|
*
|
|
* This function will be called only once for each backend name. It will be called the first time when
|
|
* `ort.InferenceSession.create()` is called with a registered backend name.
|
|
*
|
|
* @param backendName - the registered backend name.
|
|
*/
|
|
async init(backendName: string): Promise<void> {
|
|
// populate wasm flags
|
|
initializeFlags();
|
|
|
|
// init wasm
|
|
await initializeWebAssemblyAndOrtRuntime();
|
|
|
|
// performe EP specific initialization
|
|
await initializeOrtEp(backendName);
|
|
}
|
|
createInferenceSessionHandler(
|
|
path: string,
|
|
options?: InferenceSession.SessionOptions,
|
|
): Promise<InferenceSessionHandler>;
|
|
createInferenceSessionHandler(
|
|
buffer: Uint8Array,
|
|
options?: InferenceSession.SessionOptions,
|
|
): Promise<InferenceSessionHandler>;
|
|
async createInferenceSessionHandler(
|
|
pathOrBuffer: string | Uint8Array,
|
|
options?: InferenceSession.SessionOptions,
|
|
): Promise<InferenceSessionHandler> {
|
|
const handler = new OnnxruntimeWebAssemblySessionHandler();
|
|
await handler.loadModel(pathOrBuffer, options);
|
|
return Promise.resolve(handler);
|
|
}
|
|
}
|
|
|
|
export const wasmBackend = new OnnxruntimeWebAssemblyBackend();
|