onnxruntime/onnxruntime/test/python/quantization/test_op_maxpool.py

#!/usr/bin/env python
# coding: utf-8
# -------------------------------------------------------------------------
# Copyright (c) Microsoft Corporation. All rights reserved.
# Licensed under the MIT License. See License.txt in the project root for
# license information.
# --------------------------------------------------------------------------

import unittest
import onnx
import numpy as np
from onnx import helper, TensorProto
from onnxruntime.quantization import quantize_static, QuantFormat
from op_test_utils import TestDataFeeds, check_model_correctness, check_op_type_count, check_op_nodes


class TestOpMaxPool(unittest.TestCase):
    def input_feeds(self, n, name2shape):
        input_data_list = []
        for i in range(n):
            inputs = {}
            for name, shape in name2shape.items():
                inputs.update({name: np.random.randint(-1, 2, shape).astype(np.float32)})
            input_data_list.extend([inputs])
        dr = TestDataFeeds(input_data_list)
        return dr

    def construct_model_conv_maxpool(self, output_model_path,
                                     conv_input_shape, conv_weight_shape,
                                     maxpool_input_shape, maxpool_attributes,
                                     output_shape,
                                     ):
        #      (input)
        #          \
        #         Conv
        #        /    \
        #   Identity   MaxPool
        #    /            \
        # (identity_out)  (output)
        input_tensor = helper.make_tensor_value_info('input', TensorProto.FLOAT, conv_input_shape)

        conv_weight_arr = np.random.randint(-1, 2, conv_weight_shape).astype(np.float32)
        conv_weight_initializer = onnx.numpy_helper.from_array(conv_weight_arr, name='conv1_weight')
        conv_node = onnx.helper.make_node('Conv', ['input', 'conv1_weight'], ['conv_output'], name='conv_node')

        identity_out = helper.make_tensor_value_info('identity_out', TensorProto.FLOAT, maxpool_input_shape)
        identity_node = helper.make_node('Identity', ['conv_output'], ['identity_out'], name='IdentityNode')

        initializers = [conv_weight_initializer]

        output_tensor = helper.make_tensor_value_info('output', TensorProto.FLOAT, output_shape)
        maxpool_node = helper.make_node('MaxPool', ['conv_output'], ['output'], name='maxpool_node', **maxpool_attributes)

        graph = helper.make_graph([conv_node, identity_node, maxpool_node], 'TestOpQuantizerMaxPool_test_model',
                                  [input_tensor], [identity_out, output_tensor], initializer=initializers)
        model = helper.make_model(graph, opset_imports=[helper.make_opsetid("", 12)])
        model.ir_version = 7 # use stable onnx ir version
        onnx.save(model, output_model_path)

    def test_quantize_maxpool(self):
        np.random.seed(1)

        model_fp32_path = 'maxpool_fp32.onnx'
        model_uint8_path = 'maxpool_uint8.onnx'
        model_uint8_qdq_path = 'maxpool_uint8_qdq.onnx'

        self.construct_model_conv_maxpool(model_fp32_path,
                                          [1, 2, 26, 42], [3, 2, 3, 3],
                                          [1, 3, 24, 40], {'kernel_shape': [3, 3]},
                                          [1, 3, 22, 38])

        # Verify QOperator mode
        data_reader = self.input_feeds(1, {'input': [1, 2, 26, 42]})
        quantize_static(model_fp32_path, model_uint8_path, data_reader)

        # make sure maxpool become xint8 operator, its input name could tell that
        check_op_nodes(self, model_uint8_path, lambda node: (node.name != "maxpool_node" or node.input[0] != 'conv_output'))
        qnode_counts = {'QLinearConv': 1, 'QuantizeLinear': 1, 'DequantizeLinear': 2, 'MaxPool': 1}
        check_op_type_count(self, model_uint8_path, **qnode_counts)
        data_reader.rewind()
        check_model_correctness(self, model_fp32_path, model_uint8_path, data_reader.get_next())

        # Verify QDQ mode
        data_reader.rewind()
        quantize_static(model_fp32_path, model_uint8_qdq_path, data_reader, quant_format=QuantFormat.QDQ)
        qdqnode_counts = {'Conv': 1, 'QuantizeLinear': 2, 'DequantizeLinear': 3, 'MaxPool': 1}
        check_op_type_count(self, model_uint8_qdq_path, **qdqnode_counts)
        data_reader.rewind()
        check_model_correctness(self, model_fp32_path, model_uint8_qdq_path, data_reader.get_next())


if __name__ == '__main__':
    unittest.main()
Support transpose by merge Reshape etc into direct xint8 operators. (#7265) * Suppose transpose by merge Reshape etc into direct xint8 operators. * Add resize operator quantization support * Add QDQ tests for resize, reshape, maxpool, transpose. 2021-04-09 01:00:35 +00:00			`#!/usr/bin/env python`
			`# coding: utf-8`
			`# -------------------------------------------------------------------------`
			`# Copyright (c) Microsoft Corporation. All rights reserved.`
			`# Licensed under the MIT License. See License.txt in the project root for`
			`# license information.`
			`# --------------------------------------------------------------------------`

			`import unittest`
			`import onnx`
			`import numpy as np`
			`from onnx import helper, TensorProto`
			`from onnxruntime.quantization import quantize_static, QuantFormat`
			`from op_test_utils import TestDataFeeds, check_model_correctness, check_op_type_count, check_op_nodes`


			`class TestOpMaxPool(unittest.TestCase):`
			`def input_feeds(self, n, name2shape):`
			`input_data_list = []`
			`for i in range(n):`
			`inputs = {}`
			`for name, shape in name2shape.items():`
			`inputs.update({name: np.random.randint(-1, 2, shape).astype(np.float32)})`
			`input_data_list.extend([inputs])`
			`dr = TestDataFeeds(input_data_list)`
			`return dr`

			`def construct_model_conv_maxpool(self, output_model_path,`
			`conv_input_shape, conv_weight_shape,`
			`maxpool_input_shape, maxpool_attributes,`
			`output_shape,`
			`):`
			`# (input)`
			`# \`
			`# Conv`
			`# / \`
			`# Identity MaxPool`
			`# / \`
			`# (identity_out) (output)`
			`input_tensor = helper.make_tensor_value_info('input', TensorProto.FLOAT, conv_input_shape)`

			`conv_weight_arr = np.random.randint(-1, 2, conv_weight_shape).astype(np.float32)`
			`conv_weight_initializer = onnx.numpy_helper.from_array(conv_weight_arr, name='conv1_weight')`
			`conv_node = onnx.helper.make_node('Conv', ['input', 'conv1_weight'], ['conv_output'], name='conv_node')`

			`identity_out = helper.make_tensor_value_info('identity_out', TensorProto.FLOAT, maxpool_input_shape)`
			`identity_node = helper.make_node('Identity', ['conv_output'], ['identity_out'], name='IdentityNode')`

			`initializers = [conv_weight_initializer]`

			`output_tensor = helper.make_tensor_value_info('output', TensorProto.FLOAT, output_shape)`
			`maxpool_node = helper.make_node('MaxPool', ['conv_output'], ['output'], name='maxpool_node', **maxpool_attributes)`

			`graph = helper.make_graph([conv_node, identity_node, maxpool_node], 'TestOpQuantizerMaxPool_test_model',`
			`[input_tensor], [identity_out, output_tensor], initializer=initializers)`
			`model = helper.make_model(graph, opset_imports=[helper.make_opsetid("", 12)])`
use stable onnx.ir_version in test (#7747) 2021-05-19 03:14:57 +00:00			`model.ir_version = 7 # use stable onnx ir version`
Support transpose by merge Reshape etc into direct xint8 operators. (#7265) * Suppose transpose by merge Reshape etc into direct xint8 operators. * Add resize operator quantization support * Add QDQ tests for resize, reshape, maxpool, transpose. 2021-04-09 01:00:35 +00:00			`onnx.save(model, output_model_path)`

			`def test_quantize_maxpool(self):`
			`np.random.seed(1)`

			`model_fp32_path = 'maxpool_fp32.onnx'`
			`model_uint8_path = 'maxpool_uint8.onnx'`
			`model_uint8_qdq_path = 'maxpool_uint8_qdq.onnx'`

			`self.construct_model_conv_maxpool(model_fp32_path,`
			`[1, 2, 26, 42], [3, 2, 3, 3],`
			`[1, 3, 24, 40], {'kernel_shape': [3, 3]},`
			`[1, 3, 22, 38])`

			`# Verify QOperator mode`
			`data_reader = self.input_feeds(1, {'input': [1, 2, 26, 42]})`
			`quantize_static(model_fp32_path, model_uint8_path, data_reader)`

			`# make sure maxpool become xint8 operator, its input name could tell that`
			`check_op_nodes(self, model_uint8_path, lambda node: (node.name != "maxpool_node" or node.input[0] != 'conv_output'))`
			`qnode_counts = {'QLinearConv': 1, 'QuantizeLinear': 1, 'DequantizeLinear': 2, 'MaxPool': 1}`
			`check_op_type_count(self, model_uint8_path, **qnode_counts)`
			`data_reader.rewind()`
			`check_model_correctness(self, model_fp32_path, model_uint8_path, data_reader.get_next())`

			`# Verify QDQ mode`
			`data_reader.rewind()`
			`quantize_static(model_fp32_path, model_uint8_qdq_path, data_reader, quant_format=QuantFormat.QDQ)`
			`qdqnode_counts = {'Conv': 1, 'QuantizeLinear': 2, 'DequantizeLinear': 3, 'MaxPool': 1}`
			`check_op_type_count(self, model_uint8_qdq_path, **qdqnode_counts)`
			`data_reader.rewind()`
			`check_model_correctness(self, model_fp32_path, model_uint8_qdq_path, data_reader.get_next())`


			`if __name__ == '__main__':`
			`unittest.main()`