Skip to content

Commit bb14aa5

Browse files
authored
[autoWS] use minRegAutoWS and maxRegAutoWS in autotune config (#530)
1 parent 5d05cb9 commit bb14aa5

File tree

1 file changed

+4
-0
lines changed

1 file changed

+4
-0
lines changed

tritonbench/kernels/blackwell_triton_fused_attention_dp.py

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -210,6 +210,8 @@ def _host_descriptor_pre_hook(nargs):
210210
"VECT_MUL": vectmul,
211211
},
212212
pre_hook=_host_descriptor_pre_hook,
213+
minRegAutoWS=24,
214+
maxRegAutoWS=152,
213215
)
214216
for BM in [64, 128, 256]
215217
for BN in [64, 128]
@@ -224,6 +226,8 @@ def _host_descriptor_pre_hook(nargs):
224226
num_stages=s,
225227
num_warps=w,
226228
pre_hook=_host_descriptor_pre_hook,
229+
minRegAutoWS=24,
230+
maxRegAutoWS=152,
227231
# ir_override=f"override/_attn_fwd_persist.ttgir"
228232
)
229233
for BM in [256]

0 commit comments

Comments
 (0)