|
29 | 29 | # Can map to a single kernel or a list of kernel variants
|
30 | 30 | KERNEL_MAPPINGS: dict[str, tuple[str, str, str] | tuple[str, list[tuple[str, str]]]] = {
|
31 | 31 | # <tritonbench_op_name>: (<tritonbench_module_path>, <helion_kernel_module_path>, <helion_kernel_function_name>)
|
32 |
| - "vector_add": ("tritonbench.operators.vector_add.operator", "examples.add", "add"), |
33 |
| - "embedding": ( |
34 |
| - "tritonbench.operators.embedding.operator", |
35 |
| - "examples.embedding", |
36 |
| - "embedding_tritonbench", |
37 |
| - ), |
38 |
| - "vector_exp": ( |
39 |
| - "tritonbench.operators.vector_exp.operator", |
40 |
| - "examples.exp", |
41 |
| - "exp_tritonbench", |
42 |
| - ), |
43 |
| - "rms_norm": ( |
44 |
| - "tritonbench.operators.rms_norm.operator", |
45 |
| - "examples.rms_norm", |
46 |
| - "rms_norm_tritonbench", |
47 |
| - ), |
48 |
| - "sum": ("tritonbench.operators.sum.operator", "examples.sum", "sum_tritonbench"), |
49 |
| - "softmax": ( |
50 |
| - "tritonbench.operators.softmax.operator", |
51 |
| - "examples.softmax", |
52 |
| - "softmax", |
53 |
| - ), |
54 |
| - "jagged_mean": ( |
55 |
| - "tritonbench.operators.jagged_mean.operator", |
56 |
| - "examples.jagged_mean", |
57 |
| - "jagged_mean_tritonbench", |
58 |
| - ), |
59 |
| - "fp8_gemm": ( |
60 |
| - "tritonbench.operators.fp8_gemm.fp8_gemm", |
61 |
| - "examples.fp8_gemm", |
62 |
| - "fp8_gemm_tritonbench", |
| 32 | + # "vector_add": ("tritonbench.operators.vector_add.operator", "examples.add", "add"), |
| 33 | + # "embedding": ( |
| 34 | + # "tritonbench.operators.embedding.operator", |
| 35 | + # "examples.embedding", |
| 36 | + # "embedding_tritonbench", |
| 37 | + # ), |
| 38 | + # "vector_exp": ( |
| 39 | + # "tritonbench.operators.vector_exp.operator", |
| 40 | + # "examples.exp", |
| 41 | + # "exp_tritonbench", |
| 42 | + # ), |
| 43 | + # "rms_norm": ( |
| 44 | + # "tritonbench.operators.rms_norm.operator", |
| 45 | + # "examples.rms_norm", |
| 46 | + # "rms_norm_tritonbench", |
| 47 | + # ), |
| 48 | + # "sum": ("tritonbench.operators.sum.operator", "examples.sum", "sum_tritonbench"), |
| 49 | + # "softmax": ( |
| 50 | + # "tritonbench.operators.softmax.operator", |
| 51 | + # "examples.softmax", |
| 52 | + # "softmax", |
| 53 | + # ), |
| 54 | + # "jagged_mean": ( |
| 55 | + # "tritonbench.operators.jagged_mean.operator", |
| 56 | + # "examples.jagged_mean", |
| 57 | + # "jagged_mean_tritonbench", |
| 58 | + # ), |
| 59 | + # "cross_entropy": ( |
| 60 | + # "tritonbench.operators.cross_entropy.operator", |
| 61 | + # "examples.cross_entropy", |
| 62 | + # "cross_entropy", |
| 63 | + # ), |
| 64 | + # "layer_norm": ( |
| 65 | + # "tritonbench.operators.layer_norm.operator", |
| 66 | + # "examples.layer_norm", |
| 67 | + # "layer_norm_fwd", |
| 68 | + # ), |
| 69 | + # Multiple kernel variants: |
| 70 | + "gemm": ( |
| 71 | + "tritonbench.operators.gemm.operator", |
| 72 | + [ |
| 73 | + ("examples.matmul", "matmul_tritonbench"), |
| 74 | + ("examples.matmul_split_k", "matmul_split_k_tritonbench"), |
| 75 | + ], |
63 | 76 | ),
|
64 | 77 | "flash_attention": (
|
65 | 78 | "tritonbench.operators.flash_attention.operator",
|
66 | 79 | "examples.attention",
|
67 | 80 | "attention",
|
68 | 81 | ),
|
69 |
| - "cross_entropy": ( |
70 |
| - "tritonbench.operators.cross_entropy.operator", |
71 |
| - "examples.cross_entropy", |
72 |
| - "cross_entropy", |
| 82 | + "fp8_gemm": ( |
| 83 | + "tritonbench.operators.fp8_gemm.fp8_gemm", |
| 84 | + "examples.fp8_gemm", |
| 85 | + "fp8_gemm_tritonbench", |
73 | 86 | ),
|
74 | 87 | "fp8_attention": (
|
75 | 88 | "tritonbench.operators.fp8_attention.operator",
|
76 | 89 | "examples.fp8_attention",
|
77 | 90 | "fp8_attention_tritonbench",
|
78 | 91 | ),
|
79 |
| - "layer_norm": ( |
80 |
| - "tritonbench.operators.layer_norm.operator", |
81 |
| - "examples.layer_norm", |
82 |
| - "layer_norm_fwd", |
83 |
| - ), |
84 |
| - # Multiple kernel variants: |
85 |
| - "gemm": ( |
86 |
| - "tritonbench.operators.gemm.operator", |
87 |
| - [ |
88 |
| - ("examples.matmul", "matmul_tritonbench"), |
89 |
| - ("examples.matmul_split_k", "matmul_split_k_tritonbench"), |
90 |
| - ], |
91 |
| - ), |
92 | 92 | }
|
93 | 93 |
|
94 | 94 |
|
|
0 commit comments