mirror of
https://github.com/saymrwulf/onnxruntime.git
synced 2026-06-26 03:00:54 +00:00
Temporarily disable weight/bias quantization
This commit is contained in:
parent
bbb5862b9e
commit
981d95b81e
1 changed file with 1 addition and 1 deletion
|
|
@@ -249,7 +249,7 @@ InlinedVector<std::unique_ptr<GraphTransformer>> GenerateTransformers(
|
|||
|
||||
if (!disable_quant_qdq) {
|
||||
transformers.emplace_back(std::make_unique<QDQPropagationTransformer>());
|
||||
transformers.emplace_back(std::make_unique<WeightBiasQuantization>());
|
||||
//transformers.emplace_back(std::make_unique<WeightBiasQuantization>());
|
||||
|
||||
// EnsureUniqueDQForNodeUnit is actually a required graph transformation. The unique DQ per QDQ node unit input
|
||||
// condition that it ensures is important for the partitioning that happens after Level1 optimizers are run.
|
||||
|
|
|
|||
Loading…
Reference in a new issue