We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 23c0169, commit 810c0ac. Copy full SHA for 810c0ac
tritonbench/operators/launch_latency/operator.py
@@ -1,6 +1,8 @@
1
import triton.language as tl
2
from torch import zeros
3
from torch._C import _cuda_getCurrentRawStream as get_raw_stream
4
+
5
+from torch._inductor.utils import triton_version_uses_attrs_dict
6
from triton.compiler import CompiledKernel
7
8
from tritonbench.utils.triton_op import (
@@ -10,7 +12,6 @@
10
12
register_metric,
11
13
)
14
-from torch._inductor.utils import triton_version_uses_attrs_dict
15
from .kernels import get_trivial_add_kernel, nop_kernel, nop_with_args_kernel
16
17
0 commit comments