diff --git a/onnxruntime/contrib_ops/cpu/quantization/qlinear_softmax.cc b/onnxruntime/contrib_ops/cpu/quantization/qlinear_softmax.cc index 70b6e674df..ed6071b40f 100644 --- a/onnxruntime/contrib_ops/cpu/quantization/qlinear_softmax.cc +++ b/onnxruntime/contrib_ops/cpu/quantization/qlinear_softmax.cc @@ -147,9 +147,9 @@ common::Status QlinearSoftmaxCPU(size_t N, ThreadPool::TryParallelFor( thread_pool, N, // Read 3*N (max,sum,div) write N (div), computation=Read - TensorOpCost{static_cast(D * 3), + TensorOpCost{static_cast(D) * 3.0, static_cast(D), - static_cast(D * 3)}, + static_cast(D) * 3.0}, [x_data, y_data, D, y_scale, yzp, &lookup_table](std::ptrdiff_t first, std::ptrdiff_t last) { const auto c_y_scale = y_scale; const auto c_y_zp = yzp;