|
55 | 55 | "tritonbench.operators.softmax.operator",
|
56 | 56 | "examples.softmax",
|
57 | 57 | "softmax",
|
| 58 | + { |
| 59 | + "only_shapes": [ |
| 60 | + [4096, 6912 * 2 - 4096], |
| 61 | + [4096, 6976 * 2 - 4096], |
| 62 | + [4096, 7040 * 2 - 4096], |
| 63 | + [4096, 7104 * 2 - 4096], |
| 64 | + [4096, 7168 * 2 - 4096], |
| 65 | + [4096, 7232 * 2 - 4096], |
| 66 | + [4096, 7296 * 2 - 4096], |
| 67 | + [4096, 7360 * 2 - 4096], |
| 68 | + [4096, 7424 * 2 - 4096], |
| 69 | + [4096, 7488 * 2 - 4096], |
| 70 | + [4096, 7552 * 2 - 4096], |
| 71 | + [4096, 7616 * 2 - 4096], |
| 72 | + [4096, 7680 * 2 - 4096], |
| 73 | + [4096, 7744 * 2 - 4096], |
| 74 | + [4096, 7808 * 2 - 4096], |
| 75 | + [4096, 7872 * 2 - 4096], |
| 76 | + [4096, 7936 * 2 - 4096], |
| 77 | + [4096, 8000 * 2 - 4096], |
| 78 | + [4096, 8064 * 2 - 4096], |
| 79 | + [4096, 8128 * 2 - 4096], |
| 80 | + [4096, 8192 * 2 - 4096], |
| 81 | + [4096, 8256 * 2 - 4096], |
| 82 | + [4096, 8320 * 2 - 4096], |
| 83 | + [4096, 8384 * 2 - 4096], |
| 84 | + ] |
| 85 | + }, |
58 | 86 | ),
|
59 | 87 | "cross_entropy": (
|
60 | 88 | "tritonbench.operators.cross_entropy.operator",
|
|
78 | 106 | "tritonbench.operators.embedding.operator",
|
79 | 107 | "examples.embedding",
|
80 | 108 | "embedding_tritonbench",
|
| 109 | + { |
| 110 | + "only_shapes": [ |
| 111 | + (8, 2048, 4096, 16384), |
| 112 | + (8, 2048, 4096, 32768), |
| 113 | + (8, 2048, 4096, 65536), |
| 114 | + (8, 2048, 4096, 131072), |
| 115 | + ] |
| 116 | + }, |
81 | 117 | ),
|
82 | 118 | "vector_exp": (
|
83 | 119 | "tritonbench.operators.vector_exp.operator",
|
84 | 120 | "examples.exp",
|
85 | 121 | "exp_tritonbench",
|
| 122 | + { |
| 123 | + "only_shapes": [ |
| 124 | + 65536, |
| 125 | + 131072, |
| 126 | + 262144, |
| 127 | + 524288, |
| 128 | + 1048576, |
| 129 | + 2097152, |
| 130 | + 4194304, |
| 131 | + 8388608, |
| 132 | + 16777216, |
| 133 | + 33554432, |
| 134 | + 67108864, |
| 135 | + 134217728, |
| 136 | + ] |
| 137 | + }, |
86 | 138 | ),
|
87 | 139 | # "fp8_gemm": (
|
88 | 140 | # "tritonbench.operators.fp8_gemm.fp8_gemm",
|
|
0 commit comments