We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 5d05cb9 commit bb14aa5Copy full SHA for bb14aa5
tritonbench/kernels/blackwell_triton_fused_attention_dp.py
@@ -210,6 +210,8 @@ def _host_descriptor_pre_hook(nargs):
210
"VECT_MUL": vectmul,
211
},
212
pre_hook=_host_descriptor_pre_hook,
213
+ minRegAutoWS=24,
214
+ maxRegAutoWS=152,
215
)
216
for BM in [64, 128, 256]
217
for BN in [64, 128]
@@ -224,6 +226,8 @@ def _host_descriptor_pre_hook(nargs):
224
226
num_stages=s,
225
227
num_warps=w,
228
229
230
231
# ir_override=f"override/_attn_fwd_persist.ttgir"
232
233
for BM in [256]
0 commit comments