@@ -115,8 +115,8 @@ jobs:
115115 cd benchmarks/triton_kernels_benchmark
116116 python gemm_benchmark.py --reports $REPORTS
117117 mv $REPORTS/matmul-performance.csv $REPORTS/matmul-performance-base.csv
118- source ../../scripts/capture-hw-details.sh
119118
119+ source ../../scripts/capture-hw-details.sh
120120 TAG=${{ inputs.tag || 'ci' }}
121121 python ../../scripts/build_report.py $REPORTS/matmul-performance-base.csv $REPORTS/gemm-triton-report.csv --benchmark gemm --compiler triton --param_cols "B,M,K,N" --tflops_col Triton-TFlops --hbm_col "Triton-GB/s" --tag $TAG
122122 python ../../scripts/build_report.py $REPORTS/matmul-performance-base.csv $REPORTS/gemm-xetla-report.csv --benchmark gemm --compiler xetla --param_cols "B,M,K,N" --tflops_col XeTLA-TFlops --hbm_col "XeTLA-GB/s" --tag $TAG
@@ -133,8 +133,8 @@ jobs:
133133 python gemm_benchmark.py --reports $REPORTS
134134 mv $REPORTS/matmul-performance.csv $REPORTS/matmul-performance-default-path.csv
135135
136- TAG=${{ inputs.tag || 'ci' }}-dflt
137136 source ../../scripts/capture-hw-details.sh
137+ TAG=${{ inputs.tag || 'ci' }}-dflt
138138 python ../../scripts/build_report.py $REPORTS/matmul-performance-default-path.csv $REPORTS/gemm-triton-default-report.csv --benchmark gemm --compiler triton --param_cols "B,M,K,N" --tflops_col Triton-TFlops --hbm_col "Triton-GB/s" --tag $TAG
139139
140140 - name : Run Triton GEMM kernel benchmark - advanced path
@@ -149,10 +149,28 @@ jobs:
149149 python gemm_benchmark.py --reports $REPORTS
150150 mv $REPORTS/matmul-performance.csv $REPORTS/matmul-performance-adv-path.csv
151151
152- TAG=${{ inputs.tag || 'ci' }}-adv
153152 source ../../scripts/capture-hw-details.sh
153+ TAG=${{ inputs.tag || 'ci' }}-adv
154154 python ../../scripts/build_report.py $REPORTS/matmul-performance-adv-path.csv $REPORTS/gemm-triton-advanced-report.csv --benchmark gemm --compiler triton --param_cols "B,M,K,N" --tflops_col Triton-TFlops --hbm_col "Triton-GB/s" --tag $TAG
155155
156+ - name : Run Triton GEMM (stream-k) kernel benchmark
157+ if : ${{ steps.install.outcome == 'success' && !cancelled() }}
158+ run : |
159+ cd benchmarks/triton_kernels_benchmark
160+ python gemm_streamk_benchmark.py --reports $REPORTS
161+ source ../../scripts/capture-hw-details.sh
162+ TAG=${{ inputs.tag || 'ci' }}
163+ python ../../scripts/build_report.py $REPORTS/matmul-streamk-performance.csv $REPORTS/gemm-streamk-triton-report.csv --benchmark gemm-streamk --compiler triton --param_cols "M,K,N" --tflops_col Triton-TFlops --hbm_col "Triton-GB/s" --tag $TAG
164+
165+ - name : Run Triton GEMM (split-k) kernel benchmark
166+ if : ${{ steps.install.outcome == 'success' && !cancelled() }}
167+ run : |
168+ cd benchmarks/triton_kernels_benchmark
169+ python gemm_splitk_benchmark.py --reports $REPORTS
170+ source ../../scripts/capture-hw-details.sh
171+ TAG=${{ inputs.tag || 'ci' }}
172+ python ../../scripts/build_report.py $REPORTS/matmul-splitk-performance.csv $REPORTS/gemm-splitk-triton-report.csv --benchmark gemm-splitk --compiler triton --param_cols "M,K,N" --tflops_col Triton-TFlops --hbm_col "Triton-GB/s" --tag $TAG
173+
156174 - name : Run Triton GEMM + PreOp (exp) kernel benchmark
157175 if : ${{ steps.install.outcome == 'success' && !cancelled() }}
158176 run : |
0 commit comments