Skip to content

Commit 50648c7

Browse files
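Bug fix: apply the DL16 clamp to accumulator_inner (not accumulator) in matmul_kernel and matmul_kernel_DABC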
Signed-off-by: cliu-us <[email protected]>
1 parent a8d6ea9 commit 50648c7

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

fms_mo/custom_ext_kernels/triton_kernels.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -184,7 +184,7 @@ def matmul_kernel(
184 184   if chunk_trun_bits > 0:
185 185   accumulator_inner = round_and_trun(accumulator_inner, round_bit, trun_mask)
186 186   if clamp_acc_to_dl16:
187     - accumulator = fp32_clamp_to_dl16(accumulator)
    187 + accumulator_inner = fp32_clamp_to_dl16(accumulator_inner)
188 188   ## ---------------------------------------------------------
189 189   if truncate_then_accumulate:
190 190   accumulator += accumulator_inner
@@ -411,7 +411,7 @@ def matmul_kernel_DABC(
411 411   if chunk_trun_bits > 0:
412 412   accumulator_inner = round_and_trun(accumulator_inner, round_bit, trun_mask)
413 413   if clamp_acc_to_dl16:
414     - accumulator = fp32_clamp_to_dl16(accumulator)
    414 + accumulator_inner = fp32_clamp_to_dl16(accumulator_inner)
415 415   ## ---------------------------------------------------------
416 416   if truncate_then_accumulate:
417 417   accumulator += accumulator_inner

0 commit comments

Comments
 (0)