We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent e85b4f6, commit 4098dcf (copy full SHA for 4098dcf)
benchmarks/triton_kernels_benchmark/benchmark_testing.py
@@ -159,8 +159,7 @@ def extract_kernels(funcs):
159
# for correct registration of kernels.
160
# For details: https://github.com/pytorch/pytorch/issues/144778
161
kernels = [kernel for kernel in kernels if kernel != []]
162
- # FIXME: relaxation for new agama release
163
- assert len(kernels) >= n_repeat - 1, (
+ assert len(kernels) == n_repeat, (
164
f"the profiling number not match; {n_repeat=}, {kernels=}, \n" +
165
f"top functions by xpu_time:\n {prof.key_averages(group_by_stack_n=5).table(sort_by='xpu_time')}")
166
# Make the time to the milliseconds.
0 commit comments