@@ -14,14 +14,14 @@ Legend:
1414
1515| Operation | BLAS | CANN | CPU | CUDA | Metal | OpenCL | SYCL | Vulkan | zDNN |
1616| -----------| ------| ------| ------| ------| ------| ------| ------| ------| ------|
17- | ABS | β | β
| β
| π‘ | π‘ | β | π‘ | β | β |
17+ | ABS | β | β
| β
| π‘ | π‘ | β | π‘ | π‘ | β |
1818| ACC | β | β
| β
| β
| β
| β | β
| β
| β |
1919| ADD | β | β
| β
| β
| π‘ | π‘ | β
| β
| β |
2020| ADD1 | β | β
| β
| β
| β | β | β
| β | β |
21- | ADD_ID | β | β | β
| β
| β | β | β | β | β |
21+ | ADD_ID | β | β | β
| β
| β | β | β | β
| β |
2222| ARANGE | β | β
| β
| β
| β
| β | β
| β | β |
2323| ARGMAX | β | β
| β
| β
| β
| β | β
| β
| β |
24- | ARGSORT | β | β
| β
| β
| β
| β
| β
| β
| β |
24+ | ARGSORT | β | β
| β
| β
| β
| β
| β
| π‘ | β |
2525| CEIL | β | β | β
| π‘ | β | β | π‘ | β | β |
2626| CLAMP | β | β
| β
| β
| π‘ | π‘ | β
| π‘ | β |
2727| CONCAT | β | β
| β
| π‘ | β
| π‘ | β
| β
| β |
@@ -30,7 +30,7 @@ Legend:
3030| CONV_2D_DW | β | β | β
| β
| β | β | β | β
| β |
3131| CONV_3D | β | β | β
| β | β | β | β | β | β |
3232| CONV_TRANSPOSE_1D | β | β
| β
| β
| β
| β | β
| β
| β |
33- | CONV_TRANSPOSE_2D | β | β | β
| β
| β | β | β | β | β |
33+ | CONV_TRANSPOSE_2D | β | β | β
| β
| β | β | β | β
| β |
3434| COS | β | β
| β
| β
| π‘ | β | β
| π‘ | β |
3535| COUNT_EQUAL | β | β
| β
| β
| β | β | β
| β
| β |
3636| CPY | β | π‘ | π‘ | π‘ | π‘ | π‘ | π‘ | π‘ | β |
@@ -41,7 +41,7 @@ Legend:
4141| DIV | β | β
| β
| β
| π‘ | π‘ | β
| β
| β |
4242| DUP | β | β
| β
| π‘ | π‘ | π‘ | β
| π‘ | β |
4343| ELU | β | β
| β
| π‘ | π‘ | β | π‘ | β | β |
44- | EXP | β | β
| β
| π‘ | π‘ | β | π‘ | β | β |
44+ | EXP | β | β
| β
| π‘ | π‘ | β | π‘ | π‘ | β |
4545| EXPM1 | β | β | β
| π‘ | β | β | β | β | β |
4646| FILL | β | β | β
| β | β | β | β | β | β |
4747| FLASH_ATTN_EXT | β | π‘ | β
| π‘ | π‘ | β | β | π‘ | β |
@@ -57,22 +57,22 @@ Legend:
5757| GET_ROWS_BACK | β | β | π‘ | π‘ | β | β | β | β | β |
5858| GROUP_NORM | β | β
| β
| β
| β
| β
| β
| β
| β |
5959| GROUP_NORM_MUL_ADD | β | β | β | β | β | β | β
| β | β |
60- | HARDSIGMOID | β | β
| β
| π‘ | π‘ | β | π‘ | β | β |
61- | HARDSWISH | β | β
| β
| π‘ | π‘ | β | π‘ | β | β |
60+ | HARDSIGMOID | β | β
| β
| π‘ | π‘ | β | π‘ | π‘ | β |
61+ | HARDSWISH | β | β
| β
| π‘ | π‘ | β | π‘ | π‘ | β |
6262| IM2COL | β | β
| β
| β
| π‘ | β
| β
| β
| β |
63- | IM2COL_3D | β | β | β
| β
| β | β | β | β | β |
63+ | IM2COL_3D | β | β | β
| β
| β | β | β | β
| β |
6464| L2_NORM | β | β | β
| β
| β
| β | β
| β
| β |
65- | LEAKY_RELU | β | β
| β
| β
| β
| β | β
| β
| β |
65+ | LEAKY_RELU | β | β
| β
| β
| β
| β | β
| π‘ | β |
6666| LOG | β | β
| β
| β
| β | β | β
| β | β |
67- | MEAN | β | β
| β
| β
| β
| β | β
| β | β |
67+ | MEAN | β | β
| β
| β
| β
| β | β
| β
| β |
6868| MUL | β | β
| β
| β
| π‘ | π‘ | β
| β
| β |
6969| MUL_MAT | π‘ | π‘ | π‘ | π‘ | π‘ | π‘ | π‘ | π‘ | π‘ |
7070| MUL_MAT_ID | β | π‘ | β
| β
| β
| π‘ | π‘ | β
| β |
71- | NEG | β | β
| β
| π‘ | π‘ | β | π‘ | β | β |
71+ | NEG | β | β
| β
| π‘ | π‘ | β | π‘ | π‘ | β |
7272| NORM | β | β
| β
| β
| π‘ | β
| β
| π‘ | β |
7373| NORM_MUL_ADD | β | β | β | β | β | β | β
| β | β |
7474| OPT_STEP_ADAMW | β | β | β
| β
| β | β | β | β
| β |
75- | OPT_STEP_SGD | β | β | β
| β
| β | β | β | β | β |
75+ | OPT_STEP_SGD | β | β | β
| β
| β | β | β | β
| β |
7676| OUT_PROD | π‘ | β | π‘ | π‘ | β | β | π‘ | β | β |
7777| PAD | β | β
| β
| π‘ | β
| β
| π‘ | β
| β |
7878| PAD_REFLECT_1D | β | β
| β
| β
| β
| β | β
| β | β |
@@ -83,7 +83,7 @@ Legend:
8383| REPEAT_BACK | β | β | β
| β
| β | β | β
| β
| β |
8484| RMS_NORM | β | β
| β
| β
| π‘ | β
| β
| β
| β |
8585| RMS_NORM_BACK | β | β | β
| β
| β | β | β
| β
| β |
86- | RMS_NORM_MUL_ADD | β | β
| β | β | β
| β
| β
| β
| β |
86+ | RMS_NORM_MUL_ADD | β | β
| β | β | β
| β
| β
| β | β |
8787| ROLL | β | β | β
| β
| β | β | β
| β
| β |
8888| ROPE | β | π‘ | β
| β
| β
| β
| β
| β
| β |
8989| ROPE_BACK | β | β | β
| β
| β | β | β | β
| β |
@@ -104,15 +104,15 @@ Legend:
104104| SOFT_MAX_BACK | β | β | π‘ | π‘ | β | β | π‘ | β
| β |
105105| SOLVE_TRI | β | β | β
| β | β | β | β | β | β |
106106| SQR | β | β
| β
| β
| π‘ | β | β
| π‘ | β |
107- | SQRT | β | β
| β
| β
| π‘ | β | β
| β | β |
107+ | SQRT | β | β
| β
| β
| π‘ | β | β
| π‘ | β |
108108| SSM_CONV | β | β | β
| β
| β
| β | β
| β
| β |
109- | SSM_SCAN | β | β | β
| β
| β
| β | β | β
| β |
109+ | SSM_SCAN | β | β | β
| β
| β
| β | β | π‘ | β |
110110| STEP | β | β
| β
| π‘ | π‘ | β | π‘ | β | β |
111111| SUB | β | β
| β
| β
| π‘ | π‘ | β
| β
| β |
112- | SUM | β | β
| β
| π‘ | β | β | π‘ | β
| β |
112+ | SUM | β | β
| β
| π‘ | β | β | π‘ | π‘ | β |
113113| SUM_ROWS | β | β
| β
| π‘ | β
| β
| π‘ | β
| β |
114114| SWIGLU | β | β
| β
| β
| π‘ | β
| β
| π‘ | β |
115- | SWIGLU_OAI | β | β | β
| β
| β | β | β | β | β |
115+ | SWIGLU_OAI | β | β | β
| β
| β | β | β | π‘ | β |
116116| TANH | β | β
| β
| π‘ | π‘ | β
| π‘ | π‘ | β |
117117| TIMESTEP_EMBEDDING | β | β
| β
| β
| β
| β
| β
| β
| β |
118118| TOPK_MOE | β | β | β | β | β | β | β
| β | β |
0 commit comments