Temporarily disable weight/bias quantization

This commit is contained in:
Chi Lo 2025-01-22 10:15:16 -08:00
parent bbb5862b9e
commit 981d95b81e

View file

@@ -249,7 +249,7 @@ InlinedVector<std::unique_ptr<GraphTransformer>> GenerateTransformers(
if (!disable_quant_qdq) {
transformers.emplace_back(std::make_unique<QDQPropagationTransformer>());
transformers.emplace_back(std::make_unique<WeightBiasQuantization>());
//transformers.emplace_back(std::make_unique<WeightBiasQuantization>());
// EnsureUniqueDQForNodeUnit is actually a required graph transformation. The unique DQ per QDQ node unit input
// condition that it ensures is important for the partitioning that happens after Level1 optimizers are run.