mirror of
https://github.com/saymrwulf/onnxruntime.git
synced 2026-06-03 23:49:44 +00:00
Fix typos
This commit is contained in:
parent
5216a43c9d
commit
c2b4054c74
7 changed files with 9 additions and 9 deletions
|
|
@ -663,7 +663,7 @@
|
|||
"Graph pruned: 0 inputs, 0 outputs and 312 nodes are removed\n",
|
||||
"postprocess: remove Reshape count:48\n",
|
||||
"Fused FastGelu(add bias) count: 12\n",
|
||||
"opset verion: 11\n",
|
||||
"opset version: 11\n",
|
||||
"Output model to .\\onnx_models\\gpt2_past_fp32.onnx\n",
|
||||
"batch_size=1, past_sequence_length=8, torch_latency=40.68, ort_latency=24.07, ort_io_latency=24.03\n",
|
||||
"batch_size=1, past_sequence_length=16, torch_latency=40.87, ort_latency=23.14, ort_io_latency=22.27\n",
|
||||
|
|
@ -731,7 +731,7 @@
|
|||
"Graph pruned: 0 inputs, 0 outputs and 312 nodes are removed\n",
|
||||
"postprocess: remove Reshape count:48\n",
|
||||
"Fused FastGelu(add bias) count: 12\n",
|
||||
"opset verion: 11\n",
|
||||
"opset version: 11\n",
|
||||
"Output model to .\\onnx_models\\gpt2_past_int8.onnx\n",
|
||||
"quantizing model...\n",
|
||||
"Size of full precision ONNX model(MB):621.9615631103516\n",
|
||||
|
|
|
|||
|
|
@ -434,7 +434,7 @@
|
|||
" prune_graph: Graph pruned: 0 inputs, 0 outputs and 0 nodes are removed\n",
|
||||
" apply: Fused BiasGelu count: 12\n",
|
||||
" apply: Fused SkipLayerNormalization(add bias) count: 24\n",
|
||||
" optimize: opset verion: 11\n",
|
||||
" optimize: opset version: 11\n",
|
||||
" save_model_to_file: Sort graphs in topological order\n",
|
||||
" save_model_to_file: Output model to ..\\onnx_models\\bert-base-cased-squad_opt_cpu.onnx\n",
|
||||
"get_fused_operator_statistics: Optimized operators:{'EmbedLayerNormalization': 1, 'Attention': 12, 'Gelu': 0, 'FastGelu': 0, 'BiasGelu': 12, 'LayerNormalization': 0, 'SkipLayerNormalization': 24}\n",
|
||||
|
|
|
|||
|
|
@ -661,7 +661,7 @@
|
|||
" prune_graph: Graph pruned: 0 inputs, 0 outputs and 0 nodes are removed\n",
|
||||
" apply: Fused BiasGelu count: 24\n",
|
||||
" apply: Fused SkipLayerNormalization(add bias) count: 48\n",
|
||||
" optimize: opset verion: 11\n",
|
||||
" optimize: opset version: 11\n",
|
||||
" save_model_to_file: Sort graphs in topological order\n",
|
||||
" save_model_to_file: Output model to ./onnx/bert-base-cased-squad_opt_gpu_fp32.onnx\n",
|
||||
"get_fused_operator_statistics: Optimized operators:{'EmbedLayerNormalization': 1, 'Attention': 24, 'Gelu': 0, 'FastGelu': 0, 'BiasGelu': 24, 'LayerNormalization': 0, 'SkipLayerNormalization': 48}\n",
|
||||
|
|
@ -939,7 +939,7 @@
|
|||
" prune_graph: Graph pruned: 0 inputs, 0 outputs and 0 nodes are removed\n",
|
||||
" apply: Fused BiasGelu count: 24\n",
|
||||
" apply: Fused SkipLayerNormalization(add bias) count: 48\n",
|
||||
" optimize: opset verion: 11\n",
|
||||
" optimize: opset version: 11\n",
|
||||
" save_model_to_file: Sort graphs in topological order\n",
|
||||
" save_model_to_file: Output model to ./onnx/bert-base-cased-squad_opt_gpu_fp16.onnx\n",
|
||||
"get_fused_operator_statistics: Optimized operators:{'EmbedLayerNormalization': 1, 'Attention': 24, 'Gelu': 0, 'FastGelu': 0, 'BiasGelu': 24, 'LayerNormalization': 0, 'SkipLayerNormalization': 48}\n",
|
||||
|
|
|
|||
|
|
@ -350,7 +350,7 @@ class BertOnnxModel(OnnxModel):
|
|||
if add_dynamic_axes:
|
||||
self.use_dynamic_axes()
|
||||
|
||||
logger.info(f"opset verion: {self.get_opset_version()}")
|
||||
logger.info(f"opset version: {self.get_opset_version()}")
|
||||
|
||||
def get_fused_operator_statistics(self):
|
||||
"""
|
||||
|
|
|
|||
|
|
@ -102,7 +102,7 @@ TEST(SchemaRegistryManager, OpsetRegTest) {
|
|||
ASSERT_TRUE(manager.GetSchema("Op2", 1, "Domain1")->since_version() == 1);
|
||||
ASSERT_TRUE(manager.GetSchema("Op2", 2, "Domain1")->since_version() == 1);
|
||||
|
||||
// Add a new operator set which is verion 5, with a baseline of version 4, meaning that
|
||||
// Add a new operator set which is version 5, with a baseline of version 4, meaning that
|
||||
// there is a gap at version 3.
|
||||
std::shared_ptr<onnxruntime::OnnxRuntimeOpSchemaRegistry> registryV5 = std::make_shared<OnnxRuntimeOpSchemaRegistry>();
|
||||
manager.RegisterRegistry(registryV5);
|
||||
|
|
|
|||
|
|
@ -316,7 +316,7 @@ def main():
|
|||
bert_model.update_graph()
|
||||
bert_model.remove_unused_constant()
|
||||
|
||||
print("opset verion", bert_model.model.opset_import[0].version)
|
||||
print("opset version", bert_model.model.opset_import[0].version)
|
||||
|
||||
with open(args.output, "wb") as out:
|
||||
out.write(bert_model.model.SerializeToString())
|
||||
|
|
|
|||
|
|
@ -344,7 +344,7 @@ def main():
|
|||
bert_model.update_graph()
|
||||
bert_model.remove_unused_constant()
|
||||
|
||||
print("opset verion", bert_model.model.opset_import[0].version)
|
||||
print("opset version", bert_model.model.opset_import[0].version)
|
||||
|
||||
with open(args.output, "wb") as out:
|
||||
out.write(bert_model.model.SerializeToString())
|
||||
|
|
|
|||
Loading…
Reference in a new issue