mirror of
https://github.com/saymrwulf/onnxruntime.git
synced 2026-06-06 00:03:22 +00:00
Fix PoliCheck (#18180)
Fix PoliCheck by changing some words that came from Triton flash attention's original code.
This commit is contained in:
parent
08dce54266
commit
1c25fe5580
1 changed file with 1 addition and 1 deletion
|
|
@@ -393,7 +393,7 @@ def _bwd_kernel_one_col_block(
|
|||
dk = tl.zeros([BLOCK_N, BLOCK_HEADDIM], dtype=tl.float32)
|
||||
# There seems to be some problem with Triton pipelining that makes results wrong for
|
||||
# headdim=64, seqlen=(113, 255), bias_type='matrix'. In this case the for loop
|
||||
# may have zero step, and pipelining with the bias matrix could screw it up.
|
||||
# may have zero step, and pipelining with the bias matrix could cause the problem.
|
||||
# So we just exit early.
|
||||
if begin_m >= seqlen_q:
|
||||
dv_ptrs = DV + (offs_n[:, None] * stride_dvn + offs_d[None, :])
|
||||
|
|
|
|||
Loading…
Reference in a new issue