mirror of
https://github.com/saymrwulf/onnxruntime.git
synced 2026-05-14 20:48:00 +00:00
works
This commit is contained in:
parent
0a0a5ca7a8
commit
d2876b84f1
1 changed file with 1 addition and 1 deletion
|
|
@@ -60,7 +60,7 @@ class MatMulNBits final : public WebGpuKernel {
|
|||
N_ = info.GetAttr<int64_t>("N");
|
||||
block_size_ = info.GetAttr<int64_t>("block_size");
|
||||
int64_t bits = info.GetAttr<int64_t>("bits");
|
||||
accuracy_level_ = info.GetAttrOrDefault<int64_t>("accuracy_level", 4);
|
||||
accuracy_level_ = 4; // info.GetAttrOrDefault<int64_t>("accuracy_level", 4);
|
||||
ORT_ENFORCE(bits == 4,
|
||||
"Only 4b quantization is supported for MatMulNBits op, additional bits support is planned.");
|
||||
}
|
||||
|
|
|
|||
Loading…
Reference in a new issue