Get onnxruntime/core/providers/cuda/math/matmul_integer.cc from ort_training.

2026-07-21 19:18:55 +00:00 · 2020-04-09 18:09:46 -07:00 · 2020-04-09 18:09:46 -07:00 · 507d2bb9b9
commit 507d2bb9b9
parent 1b465ba820
1 changed files with 0 additions and 23 deletions
--- a/onnxruntime/core/providers/cuda/math/matmul_integer.cc
+++ b/onnxruntime/core/providers/cuda/math/matmul_integer.cc
@@ -6,7 +6,6 @@
 #include "core/providers/cpu/math/matmul_helper.h"
 #include "core/providers/cuda/shared_inc/fpgeneric.h"
 #include "core/providers/cuda/cuda_allocator.h"
-#include "core/providers/cuda/igemm.h"
 #include "core/providers/common.h"

 namespace onnxruntime {
@@ -107,28 +106,6 @@ Status MatMulInteger<int8_t, int8_t>::ComputeInternal(OpKernelContext* ctx) cons
    beta = 1;
  }

-#if CUDA_VERSION >= 10010
-  if (DeviceProp::GetDeviceProps().major >= 7 && DeviceProp::GetDeviceProps().minor >= 5) {
-    for (size_t batch = 0; batch < helper.OutputOffsets().size(); batch++) {
-      LtIgemmTensor(
-          static_cast<int>(helper.M()),
-          static_cast<int>(helper.N()),
-          static_cast<int>(helper.K()),
-          alpha,
-          beta,
-          a_ptr + helper.LeftOffsets()[batch],
-          static_cast<int>(helper.K()),
-          b_ptr + helper.RightOffsets()[batch],
-          static_cast<int>(helper.N()),
-          output_ptr + helper.OutputOffsets()[batch],
-          static_cast<int>(helper.N()),
-          this,
-          Base::CublasLtHandle());
-    }
-    return Status::OK();
-  }
-#endif
-
  // pad A and B to make their leading dimension be multiples of 32
  // because cublasGemmEx requires:
  // 1. leading dimension is multiples of 4