From 61ba5b501a18ce6ac074cf39132a30fd05487398 Mon Sep 17 00:00:00 2001
From: Yufeng Li <liyufeng1987@gmail.com>
Date: Wed, 23 Sep 2020 08:47:20 -0700
Subject: [PATCH] Fix bug in the back to back quantization of matmul and conv
 (#5264)

* Fix bug in back-to-back quantization of MatMul and Conv

* Fix bug in back-to-back Gather
---
 onnxruntime/python/tools/quantization/onnx_model.py       | 2 +-
 onnxruntime/python/tools/quantization/operators/conv.py   | 2 +-
 onnxruntime/python/tools/quantization/operators/gather.py | 2 +-
 onnxruntime/python/tools/quantization/operators/matmul.py | 2 +-
 4 files changed, 4 insertions(+), 4 deletions(-)

diff --git a/onnxruntime/python/tools/quantization/onnx_model.py b/onnxruntime/python/tools/quantization/onnx_model.py
index 2d6b209326..72ff56ea89 100644
--- a/onnxruntime/python/tools/quantization/onnx_model.py
+++ b/onnxruntime/python/tools/quantization/onnx_model.py
@@ -127,7 +127,7 @@ class ONNXModel:
                     nodes.append(node)
         return nodes
     
-     def save_model_to_file(self, output_path, use_external_data_format=False):
+    def save_model_to_file(self, output_path, use_external_data_format=False):
         '''
         Save model to external data, which is needed for model size > 2GB
         '''
diff --git a/onnxruntime/python/tools/quantization/operators/conv.py b/onnxruntime/python/tools/quantization/operators/conv.py
index 2c771ccea5..4ab79f241e 100644
--- a/onnxruntime/python/tools/quantization/operators/conv.py
+++ b/onnxruntime/python/tools/quantization/operators/conv.py
@@ -22,7 +22,7 @@ class ConvInteger(QuantOperatorBase):
             quantized_bias_name = self.quantizer.quantize_bias(node, nodes)
             bias_present = True
 
-        conv_integer_output = node.output[0] + "_quantized"
+        conv_integer_output = node.output[0] + "_output_quantized"
         conv_integer_name = node.name + "_quant" if node.name != "" else ""
 
         kwargs = {}
diff --git a/onnxruntime/python/tools/quantization/operators/gather.py b/onnxruntime/python/tools/quantization/operators/gather.py
index 9f9595775b..35830a46ad 100644
--- a/onnxruntime/python/tools/quantization/operators/gather.py
+++ b/onnxruntime/python/tools/quantization/operators/gather.py
@@ -15,7 +15,7 @@ class GatherQuant(QuantOperatorBase):
         node = self.node
         assert (node.op_type == "Gather")
         if (not self.quantizer._is_valid_quantize_weight(node.input[0])):
-            self.quantizer.new_nodes += [node]
+            super().quantize()
             return
 
         (quantized_input_names, zero_point_names, scale_names, nodes) = \
diff --git a/onnxruntime/python/tools/quantization/operators/matmul.py b/onnxruntime/python/tools/quantization/operators/matmul.py
index d765a043e1..d7a91f3577 100644
--- a/onnxruntime/python/tools/quantization/operators/matmul.py
+++ b/onnxruntime/python/tools/quantization/operators/matmul.py
@@ -18,7 +18,7 @@ class MatMulInteger(QuantOperatorBase):
         (quantized_input_names, zero_point_names, scale_names, nodes) = \
             self.quantizer.quantize_inputs(node, [0, 1])
 
-        matmul_integer_output = node.output[0] + "_quantized"
+        matmul_integer_output = node.output[0] + "_output_quantized"
         matmul_integer_name = node.name + "_quant" if node.name != "" else ""
         matmul_integer_node = onnx.helper.make_node("MatMulInteger", quantized_input_names + zero_point_names,
                                                     [matmul_integer_output], matmul_integer_name)