onnxruntime/tools/python/convert_onnx_models_to_ort.py

#!/usr/bin/env python3
# Copyright (c) Microsoft Corporation. All rights reserved.
# Licensed under the MIT License.

import argparse
import glob
import os
import pathlib
import re

import onnxruntime as ort


def _create_config_file_from_ort_models(model_path: pathlib.Path, enable_type_reduction: bool):
    """Create the operator configuration file for the ORT format models in `model_path`.

    The file is written directly inside `model_path`. It is named `required_operators_and_types.config` when
    `enable_type_reduction` is set, and `required_operators.config` otherwise.

    Args:
        model_path: Directory passed to `create_config_from_models` as the location of the models.
        enable_type_reduction: Forwarded to `create_config_from_models`; also selects the config file name.
    """
    if enable_type_reduction:
        config_name = 'required_operators_and_types.config'
    else:
        config_name = 'required_operators.config'

    target = model_path.joinpath(config_name)
    message = "Creating configuration file for operators required by ORT format models in {}."
    print(message.format(target))

    # Import at call time (after the progress message) so the helper module is only loaded when needed.
    from util.ort_format_model import create_config_from_models
    create_config_from_models(model_path, target, enable_type_reduction)


def _create_session_options(optimization_level: ort.GraphOptimizationLevel,
                            output_model_path: pathlib.Path,
                            custom_op_library: pathlib.Path):
    """Build the ort.SessionOptions used when loading a model for conversion.

    Args:
        optimization_level: Value assigned to `graph_optimization_level`.
        output_model_path: Path assigned (as a string) to `optimized_model_filepath`.
        custom_op_library: Optional path to a custom operator library. It is registered with the session options
            when provided.

    Returns:
        The configured ort.SessionOptions instance.
    """
    session_options = ort.SessionOptions()
    session_options.graph_optimization_level = optimization_level
    session_options.optimized_model_filepath = str(output_model_path)

    if not custom_op_library:
        return session_options

    session_options.register_custom_ops_library(str(custom_op_library))
    return session_options


def _convert(model_path: pathlib.Path, optimization_level: ort.GraphOptimizationLevel, use_nnapi: bool,
             custom_op_library: pathlib.Path, create_optimized_onnx_model: bool):
    """Convert all ONNX models found under `model_path` to ORT format models.

    `model_path` is searched recursively for files matching `*.onnx`. For each model an `.ort` file with the same
    base name is created in the same directory as the original model. Files ending in `.optimized.onnx` are
    skipped, as they are presumed to be output from a previous run of this script.

    Args:
        model_path: Directory to search for ONNX models.
        optimization_level: Graph optimization level set in the session options used for every model.
        use_nnapi: If True, 'NnapiExecutionProvider' is listed ahead of 'CPUExecutionProvider' when the
            inference sessions are created.
        custom_op_library: Optional path to a custom operator library to register with each session.
        create_optimized_onnx_model: If True, additionally save a `.optimized.onnx` file next to each model.

    Raises:
        ValueError: If no `.onnx` files are found under `model_path`.
    """
    models = glob.glob(os.path.join(model_path, '**', '*.onnx'), recursive=True)

    if not models:
        # model_path is a pathlib.Path, so format it rather than concatenating it with a str (which would raise
        # TypeError and hide the real problem).
        raise ValueError("No .onnx files were found in {}".format(model_path))

    providers = ['CPUExecutionProvider']
    if use_nnapi:
        # providers are priority based, so register NNAPI first
        providers.insert(0, 'NnapiExecutionProvider')

    for model in models:
        # ignore any files with an extension of .optimized.onnx which are presumably from previous executions
        # of this script
        if re.match(r'.*\.optimized\.onnx$', model, flags=re.IGNORECASE):
            print('Ignoring ' + model)
            continue

        # Create .ort file in same dir as original onnx model.
        # Match the extension case-insensitively, consistent with the other patterns in this function. Otherwise
        # a file such as MODEL.ONNX would leave the path unchanged and the ORT output would overwrite the input.
        ort_target_path = re.sub(r'\.onnx$', '.ort', model, flags=re.IGNORECASE)

        if create_optimized_onnx_model:
            # Create an ONNX file with the same optimizations that will be used for the ORT format file.
            # This allows the ONNX equivalent of the ORT format model to be easily viewed in Netron.
            optimized_target_path = re.sub(r'\.onnx$', '.optimized.onnx', model, flags=re.IGNORECASE)
            so = _create_session_options(optimization_level, optimized_target_path, custom_op_library)

            print("Saving optimized ONNX model {} to {}".format(model, optimized_target_path))
            # The session itself is not needed; it is created only so the optimized model gets saved.
            _ = ort.InferenceSession(model, sess_options=so, providers=providers)

        # Load ONNX model, optimize, and save to ORT format
        so = _create_session_options(optimization_level, ort_target_path, custom_op_library)
        so.add_session_config_entry('session.save_model_format', 'ORT')

        print("Converting optimized ONNX model to ORT format model {}".format(ort_target_path))
        _ = ort.InferenceSession(model, sess_options=so, providers=providers)


def _get_optimization_level(level):
    """Map an optimization level name to the corresponding ort.GraphOptimizationLevel value.

    Args:
        level: One of 'disable', 'basic', 'extended' or 'all'.

    Returns:
        The matching ort.GraphOptimizationLevel member. Selecting 'all' also prints a warning.

    Raises:
        ValueError: If `level` is not one of the supported names.
    """
    if level == 'all':
        # all optimizations, including NCHWc (which has hardware specific logic)
        print('WARNING: Enabling layout optimizations is not recommended unless the ORT format model will be executed '
              'on the same hardware used to create the model.')
        return ort.GraphOptimizationLevel.ORT_ENABLE_ALL

    quiet_levels = {
        'disable': ort.GraphOptimizationLevel.ORT_DISABLE_ALL,
        # Constant folding and other optimizations that only use ONNX operators
        'basic': ort.GraphOptimizationLevel.ORT_ENABLE_BASIC,
        # Optimizations using custom operators, excluding NCHWc optimizations
        'extended': ort.GraphOptimizationLevel.ORT_ENABLE_EXTENDED,
    }

    if level in quiet_levels:
        return quiet_levels[level]

    raise ValueError('Invalid optimization level of ' + level)


def parse_args() -> argparse.Namespace:
    """Define and parse the command line arguments of the conversion script.

    Returns:
        The parsed arguments with the attributes `use_nnapi`, `optimization_level`, `enable_type_reduction`,
        `custom_op_library`, `save_optimized_onnx_model` and `model_path`.
    """
    # The description names both possible configuration files, as the file name depends on whether
    # --enable_type_reduction is specified.
    parser = argparse.ArgumentParser(
        os.path.basename(__file__),
        description='''Convert the ONNX format model/s in the provided directory to ORT format models.
        All files with a `.onnx` extension will be processed. For each one, an ORT format model will be created in the
        same directory. A configuration file will also be created containing the list of required operators for all
        converted models. It is called `required_operators.config`, or `required_operators_and_types.config` if
        `--enable_type_reduction` is specified.
        This configuration file should be used as input to the minimal build via the `--include_ops_by_config`
        parameter.
        '''
    )

    parser.add_argument('--use_nnapi', action='store_true',
                        help='Enable the NNAPI Execution Provider when creating models and determining required '
                             'operators. Note that this will limit the optimizations possible on nodes that the '
                             'NNAPI execution provider takes, in order to preserve those nodes in the ORT format '
                             'model.')

    parser.add_argument('--optimization_level', default='extended',
                        choices=['disable', 'basic', 'extended', 'all'],
                        help="Level to optimize ONNX model with, prior to converting to ORT format model. "
                             "These map to the onnxruntime.GraphOptimizationLevel values. "
                             "NOTE: It is NOT recommended to use 'all' unless you are creating the ORT format model on "
                             "the device you will run it on, as the generated model may not be valid on other hardware."
                        )

    parser.add_argument('--enable_type_reduction', action='store_true',
                        help='Add operator specific type information to the configuration file to potentially reduce '
                             'the types supported by individual operator implementations.')

    parser.add_argument('--custom_op_library', type=pathlib.Path, default=None,
                        help='Provide path to shared library containing custom operator kernels to register.')

    parser.add_argument('--save_optimized_onnx_model', action='store_true',
                        help='Save the optimized version of each ONNX model. '
                             'This will have the same optimizations applied as the ORT format model.')

    parser.add_argument('model_path', type=pathlib.Path,
                        help='Provide path to directory containing ONNX model/s to convert. '
                             'All files with a .onnx extension, including in subdirectories, will be processed.')

    return parser.parse_args()


def main():
    """Run the conversion: parse arguments, validate paths, convert the models and write the config file.

    Raises:
        FileNotFoundError: If the model path is not a directory, or a custom operator library was specified but
            is not a file.
    """
    args = parse_args()

    model_dir = args.model_path.resolve()
    if args.custom_op_library:
        custom_ops_lib = args.custom_op_library.resolve()
    else:
        custom_ops_lib = None

    # Validate the inputs up front so that problems are reported before any model is loaded.
    model_dir_exists = model_dir.is_dir()
    if not model_dir_exists:
        raise FileNotFoundError('Model path {} is not a directory.'.format(model_dir))

    if custom_ops_lib:
        if not custom_ops_lib.is_file():
            raise FileNotFoundError("Unable to find custom operator library '{}'".format(custom_ops_lib))

    level = _get_optimization_level(args.optimization_level)
    _convert(model_dir, level, args.use_nnapi, custom_ops_lib, args.save_optimized_onnx_model)

    # The configuration file is created after the conversion has run.
    _create_config_file_from_ort_models(model_dir, args.enable_type_reduction)


# Only run the conversion when this file is executed as a script, not when it is imported as a module.
if __name__ == '__main__':
    main()
Add ability to track per operator types in reduced build config. (#6428) * Add ability to generate configuration that includes required types for individual operators, to allow build size reduction based on that. - Add python bindings for ORT format models - Add script to update bindings and help info - Add parsing of ORT format models - Add ability to enable type reduction to config generation - Update build.py to only allow operator/type reduction via config - simpler to require config to be generated first - can't mix a type aware (ORT format model only) and non-type aware config as that may result in insufficient types being enabled - Add script to create reduced build config - Update CIs 2021-01-28 21:59:51 +00:00			`#!/usr/bin/env python3`
Update conversion script and process to simplify creating ORT format models and a minimal build (#5217) * Update conversion script and process to simplify creating ORT format models and a minimal build. 2020-09-18 08:49:54 +00:00			`# Copyright (c) Microsoft Corporation. All rights reserved.`
			`# Licensed under the MIT License.`

			`import argparse`
			`import glob`
			`import os`
Update ORT model conversion script to support custom ops (#6701) * Add support for custom ops library to the ORT model conversion script Simplify model conversion now that we read ops from the ORT format model. Enable custom ops in the python bindings if custom ops are turned on in a minimal build. * Add test of model conversion involving custom ops. 2021-02-17 02:52:39 +00:00			`import pathlib`
Update conversion script and process to simplify creating ORT format models and a minimal build (#5217) * Update conversion script and process to simplify creating ORT format models and a minimal build. 2020-09-18 08:49:54 +00:00			`import re`

			`import onnxruntime as ort`


Update ORT model conversion script to support custom ops (#6701) * Add support for custom ops library to the ORT model conversion script Simplify model conversion now that we read ops from the ORT format model. Enable custom ops in the python bindings if custom ops are turned on in a minimal build. * Add test of model conversion involving custom ops. 2021-02-17 02:52:39 +00:00			`def _create_config_file_from_ort_models(model_path: pathlib.Path, enable_type_reduction: bool):`
			`filename = 'required_operators_and_types.config' if enable_type_reduction else 'required_operators.config'`
			`config_file_path = model_path.joinpath(filename)`

Add ability to track per operator types in reduced build config. (#6428) * Add ability to generate configuration that includes required types for individual operators, to allow build size reduction based on that. - Add python bindings for ORT format models - Add script to update bindings and help info - Add parsing of ORT format models - Add ability to enable type reduction to config generation - Update build.py to only allow operator/type reduction via config - simpler to require config to be generated first - can't mix a type aware (ORT format model only) and non-type aware config as that may result in insufficient types being enabled - Add script to create reduced build config - Update CIs 2021-01-28 21:59:51 +00:00			`print("Creating configuration file for operators required by ORT format models in {}.".format(config_file_path))`
			`from util.ort_format_model import create_config_from_models`
Update ORT model conversion script to support custom ops (#6701) * Add support for custom ops library to the ORT model conversion script Simplify model conversion now that we read ops from the ORT format model. Enable custom ops in the python bindings if custom ops are turned on in a minimal build. * Add test of model conversion involving custom ops. 2021-02-17 02:52:39 +00:00			`create_config_from_models(model_path, config_file_path, enable_type_reduction)`


			`def _create_session_options(optimization_level: ort.GraphOptimizationLevel,`
			`output_model_path: pathlib.Path,`
			`custom_op_library: pathlib.Path):`
			`so = ort.SessionOptions()`
			`so.optimized_model_filepath = str(output_model_path)`
			`so.graph_optimization_level = optimization_level`

			`if custom_op_library:`
			`so.register_custom_ops_library(str(custom_op_library))`
Update conversion script and process to simplify creating ORT format models and a minimal build (#5217) * Update conversion script and process to simplify creating ORT format models and a minimal build. 2020-09-18 08:49:54 +00:00
Update ORT model conversion script to support custom ops (#6701) * Add support for custom ops library to the ORT model conversion script Simplify model conversion now that we read ops from the ORT format model. Enable custom ops in the python bindings if custom ops are turned on in a minimal build. * Add test of model conversion involving custom ops. 2021-02-17 02:52:39 +00:00			`return so`
Update conversion script and process to simplify creating ORT format models and a minimal build (#5217) * Update conversion script and process to simplify creating ORT format models and a minimal build. 2020-09-18 08:49:54 +00:00

Update ORT model conversion script to support custom ops (#6701) * Add support for custom ops library to the ORT model conversion script Simplify model conversion now that we read ops from the ORT format model. Enable custom ops in the python bindings if custom ops are turned on in a minimal build. * Add test of model conversion involving custom ops. 2021-02-17 02:52:39 +00:00			`def _convert(model_path: pathlib.Path, optimization_level: ort.GraphOptimizationLevel, use_nnapi: bool,`
			`custom_op_library: pathlib.Path, create_optimized_onnx_model: bool):`
[ORT Mobile] ORT Minimal E2E CI (#5200) * Modify the ort minimal CI to ort minimal e2e ci 2020-09-19 08:43:22 +00:00			`models = glob.glob(os.path.join(model_path, '**', '*.onnx'), recursive=True)`
Update conversion script and process to simplify creating ORT format models and a minimal build (#5217) * Update conversion script and process to simplify creating ORT format models and a minimal build. 2020-09-18 08:49:54 +00:00
			`if len(models) == 0:`
			`raise ValueError("No .onnx files were found in " + model_path)`

Update ORT model conversion script to support custom ops (#6701) * Add support for custom ops library to the ORT model conversion script Simplify model conversion now that we read ops from the ORT format model. Enable custom ops in the python bindings if custom ops are turned on in a minimal build. * Add test of model conversion involving custom ops. 2021-02-17 02:52:39 +00:00			`providers = ['CPUExecutionProvider']`
			`if use_nnapi:`
			`# providers are priority based, so register NNAPI first`
			`providers.insert(0, 'NnapiExecutionProvider')`

			`for model in models:`
			`# ignore any files with an extension of .optimized.onnx which are presumably from previous executions`
			`# of this script`
			`if re.match(r'.*\.optimized\.onnx$', model, flags=re.IGNORECASE):`
			`print('Ignoring ' + model)`
			`continue`

			`# create .ort file in same dir as original onnx model`
			`ort_target_path = re.sub(r'\.onnx$', '.ort', model)`

			`if create_optimized_onnx_model:`
			`# Create an ONNX file with the same optimizations that will be used for the ORT format file.`
			`# This allows the ONNX equivalent of the ORT format model to be easily viewed in Netron.`
			`optimized_target_path = re.sub(r'\.onnx$', '.optimized.onnx', model, flags=re.IGNORECASE)`
			`so = _create_session_options(optimization_level, optimized_target_path, custom_op_library)`

			`print("Saving optimized ONNX model {} to {}".format(model, optimized_target_path))`
Add NNAPI to providers that can be used via the python bindings. (#5867) Update ORT model conversion script - add args for specifying optimization level and whether to use NNAPI - add logic to create a list of required ops and ORT format model that can be used with NNAPI 2020-11-20 23:18:35 +00:00			`_ = ort.InferenceSession(model, sess_options=so, providers=providers)`

Update ORT model conversion script to support custom ops (#6701) * Add support for custom ops library to the ORT model conversion script Simplify model conversion now that we read ops from the ORT format model. Enable custom ops in the python bindings if custom ops are turned on in a minimal build. * Add test of model conversion involving custom ops. 2021-02-17 02:52:39 +00:00			`# Load ONNX model, optimize, and save to ORT format`
			`so = _create_session_options(optimization_level, ort_target_path, custom_op_library)`
			`so.add_session_config_entry('session.save_model_format', 'ORT')`

			`print("Converting optimized ONNX model to ORT format model {}".format(ort_target_path))`
			`_ = ort.InferenceSession(model, sess_options=so, providers=providers)`

			`# orig_size = os.path.getsize(onnx_target_path)`
			`# new_size = os.path.getsize(ort_target_path)`
			`# print("Serialized {} to {}. Sizes: orig={} new={} diff={} new:old={:.4f}:1.0".format(`
			`# onnx_target_path, ort_target_path, orig_size, new_size, new_size - orig_size, new_size / orig_size))`
Update conversion script and process to simplify creating ORT format models and a minimal build (#5217) * Update conversion script and process to simplify creating ORT format models and a minimal build. 2020-09-18 08:49:54 +00:00

Add NNAPI to providers that can be used via the python bindings. (#5867) Update ORT model conversion script - add args for specifying optimization level and whether to use NNAPI - add logic to create a list of required ops and ORT format model that can be used with NNAPI 2020-11-20 23:18:35 +00:00			`def _get_optimization_level(level):`
			`if level == 'disable':`
			`return ort.GraphOptimizationLevel.ORT_DISABLE_ALL`
			`if level == 'basic':`
			`# Constant folding and other optimizations that only use ONNX operators`
			`return ort.GraphOptimizationLevel.ORT_ENABLE_BASIC`
			`if level == 'extended':`
			`# Optimizations using custom operators, excluding NCHWc optimizations`
			`return ort.GraphOptimizationLevel.ORT_ENABLE_EXTENDED`
			`if level == 'all':`
			`# all optimizations, including NCHWc (which has hardware specific logic)`
Expand the documentation on using compiling EPs with a minimal build (#5893) * Expand the documentation on using compiling EPs with a minimal build to call out a 'simple' option that is easier to use. Provide more background on what happens to help users choose the best option for them. Tweak conversion script to be noisier about attempted usage of 'all' optimization level. Co-authored-by: manashgoswami <magoswam@microsoft.com> 2020-12-01 23:12:36 +00:00			`print('WARNING: Enabling layout optimizations is not recommended unless the ORT format model will be executed '`
			`'on the same hardware used to create the model.')`
Add NNAPI to providers that can be used via the python bindings. (#5867) Update ORT model conversion script - add args for specifying optimization level and whether to use NNAPI - add logic to create a list of required ops and ORT format model that can be used with NNAPI 2020-11-20 23:18:35 +00:00			`return ort.GraphOptimizationLevel.ORT_ENABLE_ALL`

			`raise ValueError('Invalid optimization level of ' + level)`


Update conversion script and process to simplify creating ORT format models and a minimal build (#5217) * Update conversion script and process to simplify creating ORT format models and a minimal build. 2020-09-18 08:49:54 +00:00			`def parse_args():`
			`parser = argparse.ArgumentParser(`
			`os.path.basename(__file__),`
			`description='''Convert the ONNX format model/s in the provided directory to ORT format models.`
			All files with a `.onnx` extension will be processed. For each one, an ORT format model will be created in the
			same directory. A configuration file will also be created called `required_operators.config`, and will contain
			`the list of required operators for all converted models.`
Add ability to track per operator types in reduced build config. (#6428) * Add ability to generate configuration that includes required types for individual operators, to allow build size reduction based on that. - Add python bindings for ORT format models - Add script to update bindings and help info - Add parsing of ORT format models - Add ability to enable type reduction to config generation - Update build.py to only allow operator/type reduction via config - simpler to require config to be generated first - can't mix a type aware (ORT format model only) and non-type aware config as that may result in insufficient types being enabled - Add script to create reduced build config - Update CIs 2021-01-28 21:59:51 +00:00			This configuration file should be used as input to the minimal build via the `--include_ops_by_config`
			`parameter.`
			`'''`
Update conversion script and process to simplify creating ORT format models and a minimal build (#5217) * Update conversion script and process to simplify creating ORT format models and a minimal build. 2020-09-18 08:49:54 +00:00			`)`

Add NNAPI to providers that can be used via the python bindings. (#5867) Update ORT model conversion script - add args for specifying optimization level and whether to use NNAPI - add logic to create a list of required ops and ORT format model that can be used with NNAPI 2020-11-20 23:18:35 +00:00			`parser.add_argument('--use_nnapi', action='store_true',`
			`help='Enable the NNAPI Execution Provider when creating models and determining required '`
			`'operators. Note that this will limit the optimizations possible on nodes that the '`
			`'NNAPI execution provider takes, in order to preserve those nodes in the ORT format '`
			`'model.')`

			`parser.add_argument('--optimization_level', default='extended',`
			`choices=['disable', 'basic', 'extended', 'all'],`
			`help="Level to optimize ONNX model with, prior to converting to ORT format model. "`
			`"These map to the onnxruntime.GraphOptimizationLevel values. "`
			`"NOTE: It is NOT recommended to use 'all' unless you are creating the ORT format model on "`
			`"the device you will run it on, as the generated model may not be valid on other hardware."`
			`)`

Add ability to track per operator types in reduced build config. (#6428) * Add ability to generate configuration that includes required types for individual operators, to allow build size reduction based on that. - Add python bindings for ORT format models - Add script to update bindings and help info - Add parsing of ORT format models - Add ability to enable type reduction to config generation - Update build.py to only allow operator/type reduction via config - simpler to require config to be generated first - can't mix a type aware (ORT format model only) and non-type aware config as that may result in insufficient types being enabled - Add script to create reduced build config - Update CIs 2021-01-28 21:59:51 +00:00			`parser.add_argument('--enable_type_reduction', action='store_true',`
			`help='Add operator specific type information to the configuration file to potentially reduce '`
			`'the types supported by individual operator implementations.')`

Update ORT model conversion script to support custom ops (#6701) * Add support for custom ops library to the ORT model conversion script Simplify model conversion now that we read ops from the ORT format model. Enable custom ops in the python bindings if custom ops are turned on in a minimal build. * Add test of model conversion involving custom ops. 2021-02-17 02:52:39 +00:00			`parser.add_argument('--custom_op_library', type=pathlib.Path, default=None,`
			`help='Provide path to shared library containing custom operator kernels to register.')`

			`parser.add_argument('--save_optimized_onnx_model', action='store_true',`
			`help='Save the optimized version of each ONNX model. '`
			`'This will have the same optimizations applied as the ORT format model.')`

			`parser.add_argument('model_path', type=pathlib.Path,`
			`help='Provide path to directory containing ONNX model/s to convert. '`
			`'All files with a .onnx extension, including in subdirectories, will be processed.')`
Add NNAPI to providers that can be used via the python bindings. (#5867) Update ORT model conversion script - add args for specifying optimization level and whether to use NNAPI - add logic to create a list of required ops and ORT format model that can be used with NNAPI 2020-11-20 23:18:35 +00:00
Update conversion script and process to simplify creating ORT format models and a minimal build (#5217) * Update conversion script and process to simplify creating ORT format models and a minimal build. 2020-09-18 08:49:54 +00:00			`return parser.parse_args()`


			`def main():`
			`args = parse_args()`
Update ORT model conversion script to support custom ops (#6701) * Add support for custom ops library to the ORT model conversion script Simplify model conversion now that we read ops from the ORT format model. Enable custom ops in the python bindings if custom ops are turned on in a minimal build. * Add test of model conversion involving custom ops. 2021-02-17 02:52:39 +00:00
			`model_path = args.model_path.resolve()`
			`custom_op_library = args.custom_op_library.resolve() if args.custom_op_library else None`

			`if not model_path.is_dir():`
			`raise FileNotFoundError('Model path {} is not a directory.'.format(model_path))`

			`if custom_op_library and not custom_op_library.is_file():`
			`raise FileNotFoundError("Unable to find custom operator library '{}'".format(custom_op_library))`

Add NNAPI to providers that can be used via the python bindings. (#5867) Update ORT model conversion script - add args for specifying optimization level and whether to use NNAPI - add logic to create a list of required ops and ORT format model that can be used with NNAPI 2020-11-20 23:18:35 +00:00			`optimization_level = _get_optimization_level(args.optimization_level)`
Update ORT model conversion script to support custom ops (#6701) * Add support for custom ops library to the ORT model conversion script Simplify model conversion now that we read ops from the ORT format model. Enable custom ops in the python bindings if custom ops are turned on in a minimal build. * Add test of model conversion involving custom ops. 2021-02-17 02:52:39 +00:00			`_convert(model_path, optimization_level, args.use_nnapi, custom_op_library, args.save_optimized_onnx_model)`
			`_create_config_file_from_ort_models(model_path, args.enable_type_reduction)`
Update conversion script and process to simplify creating ORT format models and a minimal build (#5217) * Update conversion script and process to simplify creating ORT format models and a minimal build. 2020-09-18 08:49:54 +00:00

			`if __name__ == '__main__':`
			`main()`