@@ -190,47 +190,47 @@ jobs:
190190 python ../../scripts/build_report.py $REPORTS/matmul-performance-at.csv $REPORTS/gemm-at-onednn-report.csv --benchmark gemm-at --compiler onednn --param_cols "B,M,K,N" --tflops_col onednn-TFlops --hbm_col "onednn-GB/s" --tag $TAG
191191
# Step: stream-k GEMM benchmark (Triton).
# Gate change in this hunk: the removed (-) condition disabled the step whenever
# inputs.only_subset was truthy; the added (+) condition disables it only when
# inputs.skip_benchmarks contains 'gemm_streamk_benchmark.py'. Both variants still
# require the `install` step to have succeeded and the run not to be cancelled.
# Script: cd into benchmarks/triton_kernels_benchmark, run the benchmark with
# --reports $REPORTS, source capture-hw-details.sh into the current shell, then have
# build_report.py turn matmul-streamk-performance.csv into
# gemm-streamk-triton-report.csv (param columns M,K,N; tagged with $TAG).
192192 - name : Run Triton GEMM (stream-k) kernel benchmark
193- if : ${{ steps.install.outcome == 'success' && !cancelled() && !(inputs.only_subset || false ) }}
193+ if : ${{ steps.install.outcome == 'success' && !cancelled() && !contains (inputs.skip_benchmarks, 'gemm_streamk_benchmark.py' ) }}
194194 run : |
195195 cd benchmarks/triton_kernels_benchmark
196196 python gemm_streamk_benchmark.py --reports $REPORTS
197197 source ../../scripts/capture-hw-details.sh
198198 python ../../scripts/build_report.py $REPORTS/matmul-streamk-performance.csv $REPORTS/gemm-streamk-triton-report.csv --benchmark gemm-streamk --compiler triton --param_cols "M,K,N" --tflops_col Triton-TFlops --hbm_col "Triton-GB/s" --tag $TAG
199199
# Step: split-k GEMM benchmark (Triton).
# Gate change in this hunk: the removed (-) condition disabled the step whenever
# inputs.only_subset was truthy; the added (+) condition disables it only when
# inputs.skip_benchmarks contains 'gemm_splitk_benchmark.py'. Both variants still
# require the `install` step to have succeeded and the run not to be cancelled.
# Script: cd into benchmarks/triton_kernels_benchmark, run the benchmark with
# --reports $REPORTS, source capture-hw-details.sh into the current shell, then have
# build_report.py turn matmul-splitk-performance.csv into
# gemm-splitk-triton-report.csv (param columns M,K,N; tagged with $TAG).
200200 - name : Run Triton GEMM (split-k) kernel benchmark
201- if : ${{ steps.install.outcome == 'success' && !cancelled() && !(inputs.only_subset || false ) }}
201+ if : ${{ steps.install.outcome == 'success' && !cancelled() && !contains (inputs.skip_benchmarks, 'gemm_splitk_benchmark.py' ) }}
202202 run : |
203203 cd benchmarks/triton_kernels_benchmark
204204 python gemm_splitk_benchmark.py --reports $REPORTS
205205 source ../../scripts/capture-hw-details.sh
206206 python ../../scripts/build_report.py $REPORTS/matmul-splitk-performance.csv $REPORTS/gemm-splitk-triton-report.csv --benchmark gemm-splitk --compiler triton --param_cols "M,K,N" --tflops_col Triton-TFlops --hbm_col "Triton-GB/s" --tag $TAG
207207
# Step: GEMM with an exp pre-op benchmark (Triton).
# Gate change in this hunk: the removed (-) condition disabled the step whenever
# inputs.only_subset was truthy; the added (+) condition disables it only when
# inputs.skip_benchmarks contains 'gemm_preop_exp_benchmark.py'. Both variants still
# require the `install` step to have succeeded and the run not to be cancelled.
# Script: cd into benchmarks/triton_kernels_benchmark, run the benchmark with
# --reports $REPORTS, source capture-hw-details.sh into the current shell, then have
# build_report.py turn matmul-performance-preop-exp.csv into
# gemm-preop-exp-triton-report.csv (param columns B,M,K,N; tagged with $TAG).
208208 - name : Run Triton GEMM + PreOp (exp) kernel benchmark
209- if : ${{ steps.install.outcome == 'success' && !cancelled() && !(inputs.only_subset || false ) }}
209+ if : ${{ steps.install.outcome == 'success' && !cancelled() && !contains (inputs.skip_benchmarks, 'gemm_preop_exp_benchmark.py' ) }}
210210 run : |
211211 cd benchmarks/triton_kernels_benchmark
212212 python gemm_preop_exp_benchmark.py --reports $REPORTS
213213 source ../../scripts/capture-hw-details.sh
214214 python ../../scripts/build_report.py $REPORTS/matmul-performance-preop-exp.csv $REPORTS/gemm-preop-exp-triton-report.csv --benchmark gemm-preop-exp --compiler triton --param_cols "B,M,K,N" --tflops_col Triton-TFlops --hbm_col "Triton-GB/s" --tag $TAG
215215
# Step: GEMM with a Gelu post-op benchmark (Triton).
# Gate change in this hunk: the removed (-) condition disabled the step whenever
# inputs.only_subset was truthy; the added (+) condition disables it only when
# inputs.skip_benchmarks contains 'gemm_postop_gelu_benchmark.py'. Both variants still
# require the `install` step to have succeeded and the run not to be cancelled.
# Script: cd into benchmarks/triton_kernels_benchmark, run the benchmark with
# --reports $REPORTS, source capture-hw-details.sh into the current shell, then have
# build_report.py turn matmul-performance-postop-gelu.csv into
# gemm-postop-gelu-triton-report.csv (param columns B,M,K,N; tagged with $TAG).
216216 - name : Run Triton GEMM + PostOp (Gelu) kernel benchmark
217- if : ${{ steps.install.outcome == 'success' && !cancelled() && !(inputs.only_subset || false ) }}
217+ if : ${{ steps.install.outcome == 'success' && !cancelled() && !contains (inputs.skip_benchmarks, 'gemm_postop_gelu_benchmark.py' ) }}
218218 run : |
219219 cd benchmarks/triton_kernels_benchmark
220220 python gemm_postop_gelu_benchmark.py --reports $REPORTS
221221 source ../../scripts/capture-hw-details.sh
222222 python ../../scripts/build_report.py $REPORTS/matmul-performance-postop-gelu.csv $REPORTS/gemm-postop-gelu-triton-report.csv --benchmark gemm-postop-gelu --compiler triton --param_cols "B,M,K,N" --tflops_col Triton-TFlops --hbm_col "Triton-GB/s" --tag $TAG
223223
# Step: GEMM with an add-matrix post-op benchmark (Triton).
# Gate change in this hunk: the removed (-) condition disabled the step whenever
# inputs.only_subset was truthy; the added (+) condition disables it only when
# inputs.skip_benchmarks contains 'gemm_postop_addmatrix_benchmark.py'. Both variants
# still require the `install` step to have succeeded and the run not to be cancelled.
# Script: cd into benchmarks/triton_kernels_benchmark, run the benchmark with
# --reports $REPORTS, source capture-hw-details.sh into the current shell, then have
# build_report.py turn matmul-performance-postop-addmatrix.csv into
# gemm-postop-addmatrix-triton-report.csv (param columns B,M,K,N; tagged with $TAG).
224224 - name : Run Triton GEMM + PostOp (add matrix) kernel benchmark
225- if : ${{ steps.install.outcome == 'success' && !cancelled() && !(inputs.only_subset || false ) }}
225+ if : ${{ steps.install.outcome == 'success' && !cancelled() && !contains (inputs.skip_benchmarks, 'gemm_postop_addmatrix_benchmark.py' ) }}
226226 run : |
227227 cd benchmarks/triton_kernels_benchmark
228228 python gemm_postop_addmatrix_benchmark.py --reports $REPORTS
229229 source ../../scripts/capture-hw-details.sh
230230 python ../../scripts/build_report.py $REPORTS/matmul-performance-postop-addmatrix.csv $REPORTS/gemm-postop-addmatrix-triton-report.csv --benchmark gemm-postop-addmatrix --compiler triton --param_cols "B,M,K,N" --tflops_col Triton-TFlops --hbm_col "Triton-GB/s" --tag $TAG
231231
# Step: flash-attention forward benchmark (Triton). Only the head of the step is
# visible in this hunk; the remainder of its script lies outside the shown lines.
# Gate change: the removed (-) condition disabled the step whenever
# inputs.only_subset was truthy; the added (+) condition disables it only when
# inputs.skip_benchmarks contains 'flash_attention_fwd_benchmark.py'.
# NOTE(review): if inputs.skip_benchmarks is a plain string, contains() performs a
# substring match. This identifier is a prefix of
# 'flash_attention_fwd_benchmark.py_default' and
# 'flash_attention_fwd_benchmark.py_advanced' (used by the two FA steps further
# down), so a request to skip only one of those variants would also skip this step.
# Confirm the input's type/format (e.g. parsed with fromJSON into an array) or give
# this step an identifier that is not a prefix of the others.
232232 - name : Run Triton FA kernel benchmark
233- if : ${{ steps.install.outcome == 'success' && !cancelled() && !(inputs.only_subset || false ) }}
233+ if : ${{ steps.install.outcome == 'success' && !cancelled() && !contains (inputs.skip_benchmarks, 'flash_attention_fwd_benchmark.py' ) }}
234234 run : |
235235 cd benchmarks/triton_kernels_benchmark
236236 python flash_attention_fwd_benchmark.py --reports $REPORTS
@@ -240,7 +240,7 @@ jobs:
240240 python ../../scripts/build_report.py $REPORTS/attn-performance.csv $REPORTS/attn-xetla-report.csv --benchmark attn --compiler xetla --param_cols "Z,H,N_CTX,D_HEAD,CAUSAL" --tflops_col XeTLA-TFlops --hbm_col "XeTLA-GB/s" --tag $TAG
241241
242242 - name : Run Triton FA kernel benchmark - default path
243- if : ${{ steps.install.outcome == 'success' && !cancelled() && !(inputs.only_subset || false ) }}
243+ if : ${{ steps.install.outcome == 'success' && !cancelled() && !contains (inputs.skip_benchmarks, 'flash_attention_fwd_benchmark.py_default' ) }}
244244 run : |
245245 cd benchmarks/triton_kernels_benchmark
246246 TRITON_INTEL_ADVANCED_PATH=0 \
@@ -253,7 +253,7 @@ jobs:
253253 python ../../scripts/build_report.py $REPORTS/attn-performance.csv $REPORTS/attn-triton-default-report.csv --benchmark attn --compiler triton --param_cols "Z,H,N_CTX,D_HEAD,CAUSAL" --tflops_col Triton-TFlops --hbm_col "Triton-GB/s" --tag $TAG
254254
255255 - name : Run Triton FA kernel benchmark - advanced path
256- if : ${{ steps.install.outcome == 'success' && !cancelled() && !(inputs.only_subset || false ) }}
256+ if : ${{ steps.install.outcome == 'success' && !cancelled() && !contains (inputs.skip_benchmarks, 'flash_attention_fwd_benchmark.py_advanced' ) }}
257257 run : |
258258 cd benchmarks/triton_kernels_benchmark
259259 TRITON_INTEL_ADVANCED_PATH=1 \
@@ -266,15 +266,15 @@ jobs:
266266 python ../../scripts/build_report.py $REPORTS/attn-performance.csv $REPORTS/attn-triton-advanced-report.csv --benchmark attn --compiler triton --param_cols "Z,H,N_CTX,D_HEAD,CAUSAL" --tflops_col Triton-TFlops --hbm_col "Triton-GB/s" --tag $TAG
267267
# Step: prefix-sums kernel benchmark (Triton).
# Gate change in this hunk: the removed (-) condition disabled the step whenever
# inputs.only_subset was truthy; the added (+) condition disables it only when
# inputs.skip_benchmarks contains 'prefix_sums.py'. Both variants still require the
# `install` step to have succeeded and the run not to be cancelled.
# Script: cd into benchmarks/triton_kernels_benchmark, run prefix_sums.py with
# --reports $REPORTS, source capture-hw-details.sh into the current shell, then have
# build_report.py turn prefix-sums.csv into prefix_sums-triton-report.csv
# (param column N; tagged with $TAG).
268268 - name : Run Prefix Sums kernel benchmark
269- if : ${{ steps.install.outcome == 'success' && !cancelled() && !(inputs.only_subset || false ) }}
269+ if : ${{ steps.install.outcome == 'success' && !cancelled() && !contains (inputs.skip_benchmarks, 'prefix_sums.py' ) }}
270270 run : |
271271 cd benchmarks/triton_kernels_benchmark
272272 python prefix_sums.py --reports $REPORTS
273273 source ../../scripts/capture-hw-details.sh
274274 python ../../scripts/build_report.py $REPORTS/prefix-sums.csv $REPORTS/prefix_sums-triton-report.csv --benchmark prefix_sums --compiler triton --param_cols "N" --tflops_col Triton-TFlops --hbm_col "Triton-GB/s" --tag $TAG
275275
276276 - name : Run micro benchmark
277- if : ${{ steps.install.outcome == 'success' && !cancelled() && !(inputs.only_subset || false ) }}
277+ if : ${{ steps.install.outcome == 'success' && !cancelled() && !contains (inputs.skip_benchmarks, 'micro_benchmarks' ) }}
278278 run : |
279279 cd benchmarks/micro_benchmarks
280280 python run_benchmarks.py --reports $REPORTS
0 commit comments