mirror of
https://github.com/saymrwulf/onnxruntime.git
synced 2026-05-15 20:50:42 +00:00
**Description**: This PR adds support for "XNNPACK EP" in ORTWeb and changes the behavior of how ORTWeb deals with "backends", or "EPs" in API. **Background**: Term "backend" is introduced in ONNX.js to representing a TypeScript type which implements a "backend" interface, which is a similar but different concept to ORT's EP (execution provider). There was 3 backends in ONNX.js: "cpu", "wasm" and "webgl". When ORT Web is launched, the concept is derived to help users to integrate smoothly. Technically, when "wasm" backend is used, users need to also specify "EP" in the session options. Considering it may get complicated and confused for users to figure out the difference between "backend" and "EP", the JS API hide the "backend" concept and made a mapping between names, backends and EPs: "webgl" (Name) <==> "onnxjsBackend" (Backend) "wasm" (Name) <==> "wasmBackend" (Backend) <==> "CPU" (EP) **Details**: The following changes are applied in this PR: 1. allow multi-registration for backends using the same name. This is for use scenarios where both "onnxruntime-node" and "onnxruntime-web" are consumed in a Node.js App ( so "cpu" will be registered twice in this scenario. ) 2. re-assign priority values to backends. I give 100 as base to "cpu" for node and react_native, and 10 as base to "cpu" in web. 3. add "cpu", "xnnpack" as new names of backends. 4. update onnxruntime wasm exported functions to support EP registration. 5. update implementations in ort web to handle execution providers in session options. 6. add '--use_xnnpack' as default build flag for ort-web
415 lines
15 KiB
TypeScript
415 lines
15 KiB
TypeScript
// Copyright (c) Microsoft Corporation. All rights reserved.
|
|
// Licensed under the MIT License.
|
|
|
|
import minimist from 'minimist';
|
|
import npmlog from 'npmlog';
|
|
import {Env, InferenceSession} from 'onnxruntime-common';
|
|
|
|
import {Logger} from '../lib/onnxjs/instrument';
|
|
import {Test} from '../test/test-types';
|
|
|
|
/* eslint-disable max-len */
|
|
const HELP_MESSAGE = `
|
|
test-runner-cli
|
|
|
|
Run ONNX Runtime Web tests, models, benchmarks in different environments.
|
|
|
|
Usage:
|
|
test-runner-cli <mode> ... [options]
|
|
|
|
Modes:
|
|
suite0 Run all unittests, all operator tests and node model tests that described in suite test list
|
|
suite1 Run all operator tests and node model tests that described in suite test list
|
|
model Run a single model test
|
|
unittest Run all unittests
|
|
op Run a single operator test
|
|
|
|
Options:
|
|
|
|
*** General Options ***
|
|
|
|
-h, --help Print this message.
|
|
-d, --debug Specify to run test runner in debug mode.
|
|
Debug mode outputs verbose log for test runner, sets up environment debug flag, and keeps karma not to exit after tests completed.
|
|
-b=<...>, --backend=<...> Specify one or more backend(s) to run the test upon.
|
|
Backends can be one or more of the following, splitted by comma:
|
|
webgl
|
|
wasm
|
|
xnnpack
|
|
-e=<...>, --env=<...> Specify the environment to run the test. Should be one of the following:
|
|
chrome (default)
|
|
edge (Windows only)
|
|
firefox
|
|
electron
|
|
safari (MacOS only)
|
|
node
|
|
bs (for BrowserStack tests)
|
|
-p, --profile Enable profiler.
|
|
Profiler will generate extra logs which include the information of events time consumption
|
|
-P[=<...>], --perf[=<...>] Generate performance number. Cannot be used with flag --debug.
|
|
This flag can be used with a number as value, specifying the total count of test cases to run. The test cases may be used multiple times. Default value is 10.
|
|
-c, --file-cache Enable file cache.
|
|
|
|
*** Logging Options ***
|
|
|
|
--log-verbose=<...> Set log level to verbose
|
|
--log-info=<...> Set log level to info
|
|
--log-warning=<...> Set log level to warning
|
|
--log-error=<...> Set log level to error
|
|
The 4 flags above specify the logging configuration. Each flag allows to specify one or more category(s), splitted by comma. If use the flags without value, the log level will be applied to all category.
|
|
|
|
*** Backend Options ***
|
|
|
|
--wasm-number-threads Set the WebAssembly number of threads
|
|
--wasm-init-timeout Set the timeout for WebAssembly backend initialization, in milliseconds
|
|
--wasm-enable-simd Set whether to enable SIMD
|
|
--wasm-enable-proxy Set whether to enable proxy worker
|
|
--webgl-context-id Set the WebGL context ID (webgl/webgl2)
|
|
--webgl-matmul-max-batch-size Set the WebGL matmulMaxBatchSize
|
|
--webgl-texture-cache-mode Set the WebGL texture cache mode (initializerOnly/full)
|
|
--webgl-texture-pack-mode Set the WebGL texture pack mode (true/false)
|
|
|
|
*** Browser Options ***
|
|
|
|
--no-sandbox This flag will be passed to Chrome.
|
|
Sometimes Chrome need this flag to work together with Karma.
|
|
|
|
Examples:
|
|
|
|
Run all suite0 tests:
|
|
> test-runner-cli suite0
|
|
|
|
Run single model test (test_relu) on WebAssembly backend
|
|
> test-runner-cli model test_relu --backend=wasm
|
|
|
|
Debug unittest
|
|
> test-runner-cli unittest --debug
|
|
|
|
Debug operator matmul, highlight verbose log from BaseGlContext and WebGLBackend
|
|
> test-runner-cli op matmul --backend=webgl --debug --log-verbose=BaseGlContext,WebGLBackend
|
|
|
|
Profile an ONNX model on WebGL backend
|
|
> test-runner-cli model <model_folder> --profile --backend=webgl
|
|
|
|
Run perf testing of an ONNX model on WebGL backend
|
|
> test-runner-cli model <model_folder> -b=webgl -P
|
|
`;
|
|
/* eslint-enable max-len */
|
|
|
|
export declare namespace TestRunnerCliArgs {
|
|
type Mode = 'suite0'|'suite1'|'model'|'unittest'|'op';
|
|
type Backend = 'cpu'|'webgl'|'wasm'|'onnxruntime'|'xnnpack';
|
|
type Environment = 'chrome'|'edge'|'firefox'|'electron'|'safari'|'node'|'bs';
|
|
type BundleMode = 'prod'|'dev'|'perf';
|
|
}
|
|
|
|
export interface TestRunnerCliArgs {
|
|
debug: boolean;
|
|
mode: TestRunnerCliArgs.Mode;
|
|
/**
|
|
* The parameter that used when in mode 'model' or 'op', specifying the search string for the model or op test
|
|
*/
|
|
param?: string;
|
|
backends: [TestRunnerCliArgs.Backend];
|
|
env: TestRunnerCliArgs.Environment;
|
|
|
|
/**
|
|
* Bundle Mode
|
|
*
|
|
* this field affects the behavior of Karma and Webpack.
|
|
*
|
|
* For Karma, if flag '--bundle-mode' is not set, the default behavior is 'dev'
|
|
* For Webpack, if flag '--bundle-mode' is not set, the default behavior is 'prod'
|
|
*
|
|
* For running tests, the default mode is 'dev'. If flag '--perf' is set, the mode will be set to 'perf'.
|
|
*
|
|
* Mode | Output File | Main | Source Map | Webpack Config
|
|
* ------ | --------------------- | -------------------- | ------------------ | --------------
|
|
* prod | /dist/ort.min.js | /lib/index.ts | source-map | production
|
|
* node | /dist/ort-web.node.js | /lib/index.ts | source-map | production
|
|
* dev | /test/ort.dev.js | /test/test-main.ts | inline-source-map | development
|
|
* perf | /test/ort.perf.js | /test/test-main.ts | (none) | production
|
|
*/
|
|
bundleMode: TestRunnerCliArgs.BundleMode;
|
|
|
|
logConfig: Test.Config['log'];
|
|
|
|
/**
|
|
* Whether to enable InferenceSession's profiler
|
|
*/
|
|
profile: boolean;
|
|
|
|
/**
|
|
* Whether to enable file cache
|
|
*/
|
|
fileCache: boolean;
|
|
|
|
/**
|
|
* Specify the times that test cases to run
|
|
*/
|
|
times?: number;
|
|
|
|
cpuOptions?: InferenceSession.CpuExecutionProviderOption;
|
|
cudaOptions?: InferenceSession.CudaExecutionProviderOption;
|
|
cudaFlags?: Record<string, unknown>;
|
|
wasmOptions?: InferenceSession.WebAssemblyExecutionProviderOption;
|
|
webglOptions?: InferenceSession.WebGLExecutionProviderOption;
|
|
globalEnvFlags?: Env;
|
|
noSandbox?: boolean;
|
|
}
|
|
|
|
|
|
function parseBooleanArg(arg: unknown, defaultValue: boolean): boolean;
|
|
function parseBooleanArg(arg: unknown): boolean|undefined;
|
|
function parseBooleanArg(arg: unknown, defaultValue?: boolean): boolean|undefined {
|
|
if (typeof arg === 'undefined') {
|
|
return defaultValue;
|
|
}
|
|
|
|
if (typeof arg === 'boolean') {
|
|
return arg;
|
|
}
|
|
|
|
if (typeof arg === 'number') {
|
|
return arg !== 0;
|
|
}
|
|
|
|
if (typeof arg === 'string') {
|
|
if (arg.toLowerCase() === 'true') {
|
|
return true;
|
|
}
|
|
if (arg.toLowerCase() === 'false') {
|
|
return false;
|
|
}
|
|
}
|
|
|
|
throw new TypeError(`invalid boolean arg: ${arg}`);
|
|
}
|
|
|
|
function parseLogLevel<T>(arg: T) {
|
|
let v: string[]|boolean;
|
|
if (typeof arg === 'string') {
|
|
v = arg.split(',');
|
|
} else if (Array.isArray(arg)) {
|
|
v = [];
|
|
for (const e of arg) {
|
|
v.push(...e.split(','));
|
|
}
|
|
} else {
|
|
v = arg ? true : false;
|
|
}
|
|
return v;
|
|
}
|
|
|
|
function parseLogConfig(args: minimist.ParsedArgs) {
|
|
const config: Array<{category: string; config: Logger.Config}> = [];
|
|
const verbose = parseLogLevel(args['log-verbose']);
|
|
const info = parseLogLevel(args['log-info']);
|
|
const warning = parseLogLevel(args['log-warning']);
|
|
const error = parseLogLevel(args['log-error']);
|
|
|
|
if (typeof error === 'boolean' && error) {
|
|
config.push({category: '*', config: {minimalSeverity: 'error'}});
|
|
} else if (typeof warning === 'boolean' && warning) {
|
|
config.push({category: '*', config: {minimalSeverity: 'warning'}});
|
|
} else if (typeof info === 'boolean' && info) {
|
|
config.push({category: '*', config: {minimalSeverity: 'info'}});
|
|
} else if (typeof verbose === 'boolean' && verbose) {
|
|
config.push({category: '*', config: {minimalSeverity: 'verbose'}});
|
|
}
|
|
|
|
if (Array.isArray(error)) {
|
|
config.push(...error.map(i => ({category: i, config: {minimalSeverity: 'error' as Logger.Severity}})));
|
|
}
|
|
if (Array.isArray(warning)) {
|
|
config.push(...warning.map(i => ({category: i, config: {minimalSeverity: 'warning' as Logger.Severity}})));
|
|
}
|
|
if (Array.isArray(info)) {
|
|
config.push(...info.map(i => ({category: i, config: {minimalSeverity: 'info' as Logger.Severity}})));
|
|
}
|
|
if (Array.isArray(verbose)) {
|
|
config.push(...verbose.map(i => ({category: i, config: {minimalSeverity: 'verbose' as Logger.Severity}})));
|
|
}
|
|
|
|
return config;
|
|
}
|
|
|
|
function parseCpuOptions(_args: minimist.ParsedArgs): InferenceSession.CpuExecutionProviderOption {
|
|
return {name: 'cpu'};
|
|
}
|
|
|
|
function parseCpuFlags(_args: minimist.ParsedArgs): Record<string, unknown> {
|
|
return {};
|
|
}
|
|
|
|
function parseWasmOptions(_args: minimist.ParsedArgs): InferenceSession.WebAssemblyExecutionProviderOption {
|
|
return {name: 'wasm'};
|
|
}
|
|
|
|
function parseWasmFlags(args: minimist.ParsedArgs): Env.WebAssemblyFlags {
|
|
const numThreads = args['wasm-number-threads'];
|
|
if (typeof numThreads !== 'undefined' && typeof numThreads !== 'number') {
|
|
throw new Error('Flag "wasm-number-threads" must be a number value');
|
|
}
|
|
const initTimeout = args['wasm-init-timeout'];
|
|
if (typeof initTimeout !== 'undefined' && typeof initTimeout !== 'number') {
|
|
throw new Error('Flag "wasm-init-timeout" must be a number value');
|
|
}
|
|
let simd = args['wasm-enable-simd'];
|
|
if (simd === 'true') {
|
|
simd = true;
|
|
} else if (simd === 'false') {
|
|
simd = false;
|
|
} else if (typeof simd !== 'undefined' && typeof simd !== 'boolean') {
|
|
throw new Error('Flag "wasm-enable-simd" must be a boolean value');
|
|
}
|
|
let proxy = args['wasm-enable-proxy'];
|
|
if (proxy === 'true') {
|
|
proxy = true;
|
|
} else if (proxy === 'false') {
|
|
proxy = false;
|
|
} else if (typeof proxy !== 'undefined' && typeof proxy !== 'boolean') {
|
|
throw new Error('Flag "wasm-enable-proxy" must be a boolean value');
|
|
}
|
|
return {numThreads, initTimeout, simd, proxy};
|
|
}
|
|
|
|
function parseWebglOptions(_args: minimist.ParsedArgs): InferenceSession.WebGLExecutionProviderOption {
|
|
return {name: 'webgl'};
|
|
}
|
|
|
|
function parseWebglFlags(args: minimist.ParsedArgs): Env.WebGLFlags {
|
|
const contextId = args['webgl-context-id'];
|
|
if (contextId !== undefined && contextId !== 'webgl' && contextId !== 'webgl2') {
|
|
throw new Error('Flag "webgl-context-id" is invalid');
|
|
}
|
|
const matmulMaxBatchSize = args['webgl-matmul-max-batch-size'];
|
|
if (matmulMaxBatchSize !== undefined && typeof matmulMaxBatchSize !== 'number') {
|
|
throw new Error('Flag "webgl-matmul-max-batch-size" must be a number value');
|
|
}
|
|
const textureCacheMode = args['webgl-texture-cache-mode'];
|
|
if (textureCacheMode !== undefined && textureCacheMode !== 'initializerOnly' && textureCacheMode !== 'full') {
|
|
throw new Error('Flag "webgl-texture-cache-mode" is invalid');
|
|
}
|
|
const pack = args['webgl-texture-pack-mode'];
|
|
if (pack !== undefined && typeof pack !== 'boolean') {
|
|
throw new Error('Flag "webgl-texture-pack-mode" is invalid');
|
|
}
|
|
const async = args['webgl-async'];
|
|
if (async !== undefined && typeof async !== 'boolean') {
|
|
throw new Error('Flag "webgl-async" is invalid');
|
|
}
|
|
return {contextId, matmulMaxBatchSize, textureCacheMode, pack};
|
|
}
|
|
|
|
function parseGlobalEnvFlags(args: minimist.ParsedArgs): Env {
|
|
const wasmFlags = parseWasmFlags(args);
|
|
const webglFlags = parseWebglFlags(args);
|
|
const cpuFlags = parseCpuFlags(args);
|
|
return {webgl: webglFlags, wasm: wasmFlags, cpuFlags};
|
|
}
|
|
|
|
export function parseTestRunnerCliArgs(cmdlineArgs: string[]): TestRunnerCliArgs {
|
|
const args = minimist(cmdlineArgs);
|
|
|
|
if (args.help || args.h) {
|
|
console.log(HELP_MESSAGE);
|
|
process.exit();
|
|
}
|
|
|
|
// Option: -d, --debug
|
|
const debug = parseBooleanArg(args.debug || args.d, false);
|
|
if (debug) {
|
|
npmlog.level = 'verbose';
|
|
}
|
|
npmlog.verbose('TestRunnerCli.Init', 'Parsing commandline arguments...');
|
|
|
|
const mode = args._.length === 0 ? 'suite0' : args._[0];
|
|
|
|
// Option: -e=<...>, --env=<...>
|
|
const envArg = args.env || args.e;
|
|
const env = (typeof envArg !== 'string') ? 'chrome' : envArg;
|
|
if (['chrome', 'edge', 'firefox', 'electron', 'safari', 'node', 'bs'].indexOf(env) === -1) {
|
|
throw new Error(`not supported env ${env}`);
|
|
}
|
|
|
|
// Option: -b=<...>, --backend=<...>
|
|
const browserBackends = ['webgl', 'wasm', 'xnnpack'];
|
|
const nodejsBackends = ['cpu', 'wasm'];
|
|
const backendArgs = args.backend || args.b;
|
|
const backend =
|
|
(typeof backendArgs !== 'string') ? (env === 'node' ? nodejsBackends : browserBackends) : backendArgs.split(',');
|
|
for (const b of backend) {
|
|
if ((env !== 'node' && browserBackends.indexOf(b) === -1) || (env === 'node' && nodejsBackends.indexOf(b) === -1)) {
|
|
throw new Error(`backend ${b} is not supported in env ${env}`);
|
|
}
|
|
}
|
|
|
|
const globalEnvFlags = parseGlobalEnvFlags(args);
|
|
|
|
// Options:
|
|
// --log-verbose=<...>
|
|
// --log-info=<...>
|
|
// --log-warning=<...>
|
|
// --log-error=<...>
|
|
const logConfig = parseLogConfig(args);
|
|
globalEnvFlags.logLevel = logConfig[0]?.config.minimalSeverity;
|
|
// Option: -p, --profile
|
|
const profile = (args.profile || args.p) ? true : false;
|
|
if (profile) {
|
|
logConfig.push({category: 'Profiler.session', config: {minimalSeverity: 'verbose'}});
|
|
logConfig.push({category: 'Profiler.node', config: {minimalSeverity: 'verbose'}});
|
|
logConfig.push({category: 'Profiler.op', config: {minimalSeverity: 'verbose'}});
|
|
logConfig.push({category: 'Profiler.backend', config: {minimalSeverity: 'verbose'}});
|
|
globalEnvFlags.logLevel = 'verbose';
|
|
}
|
|
|
|
// Option: -P[=<...>], --perf[=<...>]
|
|
const perfArg = (args.perf || args.P);
|
|
const perf = perfArg ? true : false;
|
|
const times = (typeof perfArg === 'number') ? perfArg : 10;
|
|
if (debug && perf) {
|
|
throw new Error('Flag "perf" cannot be used together with flag "debug".');
|
|
}
|
|
if (perf && (mode !== 'model')) {
|
|
throw new Error('Flag "perf" can only be used in mode "model".');
|
|
}
|
|
if (perf) {
|
|
logConfig.push({category: 'TestRunner.Perf', config: {minimalSeverity: 'verbose'}});
|
|
}
|
|
|
|
// Option: -c, --file-cache
|
|
const fileCache = parseBooleanArg(args['file-cache'] || args.c, false);
|
|
|
|
const cpuOptions = parseCpuOptions(args);
|
|
const wasmOptions = parseWasmOptions(args);
|
|
|
|
const webglOptions = parseWebglOptions(args);
|
|
|
|
// Option: --no-sandbox
|
|
const noSandbox = !!args['no-sandbox'];
|
|
|
|
npmlog.verbose('TestRunnerCli.Init', ` Mode: ${mode}`);
|
|
npmlog.verbose('TestRunnerCli.Init', ` Env: ${env}`);
|
|
npmlog.verbose('TestRunnerCli.Init', ` Debug: ${debug}`);
|
|
npmlog.verbose('TestRunnerCli.Init', ` Backend: ${backend}`);
|
|
npmlog.verbose('TestRunnerCli.Init', 'Parsing commandline arguments... DONE');
|
|
|
|
return {
|
|
debug,
|
|
mode: mode as TestRunnerCliArgs['mode'],
|
|
param: args._.length > 1 ? args._[1] : undefined,
|
|
backends: backend as TestRunnerCliArgs['backends'],
|
|
bundleMode: perf ? 'perf' : 'dev',
|
|
env: env as TestRunnerCliArgs['env'],
|
|
logConfig,
|
|
profile,
|
|
times: perf ? times : undefined,
|
|
fileCache,
|
|
cpuOptions,
|
|
webglOptions,
|
|
wasmOptions,
|
|
globalEnvFlags,
|
|
noSandbox
|
|
};
|
|
}
|