mirror of
https://github.com/saymrwulf/onnxruntime.git
synced 2026-05-28 22:56:32 +00:00
Fix bug in Attention Fusion (#13050)
This commit is contained in:
parent
cccbe90764
commit
057567f39f
1 changed file with 1 addition and 1 deletion
|
|
@@ -242,7 +242,7 @@ class FusionAttention(Fusion):
|
|||
# For 2d weights, the shapes would be [in_size, out_size].
|
||||
# For 3d weights, shape would be [in_size, a, b] where a*b = out_size
|
||||
qw_out_size = np.prod(qw.shape[1:])
|
||||
kw_out_size = np.prod(qw.shape[1:])
|
||||
kw_out_size = np.prod(kw.shape[1:])
|
||||
vw_out_size = np.prod(vw.shape[1:])
|
||||
|
||||
qkv_weight_dim = 0
|
||||
|
|
|
|||
Loading…
Reference in a new issue