Skip to content

Commit 9e859f6

Browse files
authored
[nightly] Fix linting and oss tags (#653)
1 parent 308b043 commit 9e859f6

File tree

5 files changed

+273
-131
lines changed

5 files changed

+273
-131
lines changed

.github/workflows/nightly.yml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -35,7 +35,7 @@ jobs:
3535
h100-triton-main-nightly-benchmark:
3636
uses: ./.github/workflows/_linux-benchmark-h100.yml
3737
with:
38-
test_type: ${{ inputs.test_type }}
38+
test_type: ${{ inputs.test_type || 'periodic' }}
3939
benchmark_name: "nightly"
4040
side_a_triton: ${{ inputs.side_a_triton }}
4141
side_a_commit: ${{ inputs.side_a_commit }}
@@ -46,7 +46,7 @@ jobs:
4646
mi350-triton-main-nightly-benchmark:
4747
uses: ./.github/workflows/_linux-benchmark-mi350.yml
4848
with:
49-
test_type: ${{ inputs.test_type }}
49+
test_type: ${{ inputs.test_type || 'periodic' }}
5050
benchmark_name: "nightly"
5151
side_a_triton: ${{ inputs.side_a_triton }}
5252
side_a_commit: ${{ inputs.side_a_commit }}

benchmarks/nightly/autogen.yaml

Lines changed: 14 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -38,9 +38,16 @@ fp8_gemm_fwd:
3838
args: --op fp8_gemm --baseline torch_fp8_gemm --metrics latency,tflops,speedup --only
3939
triton_fp8_gemm,triton_persistent_fp8_gemm,triton_tma_persistent_fp8_gemm,torch_fp8_gemm
4040
disabled: true
41+
fp8_gemm_blockwise_fwd:
42+
args: --op fp8_gemm_blockwise --baseline _cutlass --metrics latency,tflops,speedup
43+
--only _triton,_cutlass
4144
fp8_gemm_rowwise_fwd:
4245
args: --op fp8_gemm_rowwise --baseline _cutlass_or_ck --metrics latency,tflops,speedup
43-
--only _aoti_fp8_triton_mm,_cutlass_or_ck
46+
--only _aoti_fp8_triton_mm,_triton,_cutlass_or_ck
47+
disabled: true
48+
fp8_gemm_rowwise_grouped_fwd:
49+
args: --op fp8_gemm_rowwise_grouped --baseline eager_fp8_gemm_rowwise_grouped --metrics
50+
latency,tflops,speedup --only _triton,eager_fp8_gemm_rowwise_grouped
4451
disabled: true
4552
fused_linear_cross_entropy_fwd:
4653
args: --op fused_linear_cross_entropy --baseline torch_lm_head_ce --metrics latency,speedup
@@ -57,6 +64,11 @@ fused_linear_jsd_bwd:
5764
gather_gemv_fwd:
5865
args: --op gather_gemv --baseline eager_gather_gemv --metrics latency,speedup --only
5966
triton_gather_gemv,eager_gather_gemv
67+
bf16_gdpa_fwd:
68+
args: --op gdpa --baseline eager_gdpa --metrics latency,speedup --only gdpa,gdpa_opt,gdpa_opt_sorted,eager_gdpa
69+
bf16_gdpa_bwd:
70+
args: --op gdpa --baseline eager_gdpa --metrics latency,speedup --only gdpa,gdpa_opt,gdpa_opt_sorted,eager_gdpa
71+
--bwd
6072
geglu_fwd:
6173
args: --op geglu --baseline torch_geglu --metrics latency,speedup --only liger_geglu,torch_geglu
6274
geglu_bwd:
@@ -69,7 +81,7 @@ fp16_gemm_bwd:
6981
--bwd
7082
bf16_grouped_gemm_fwd:
7183
args: --op grouped_gemm --baseline aten_grouped_mm --metrics latency,tflops,speedup
72-
--only triton_grouped_gemm,aten_grouped_mm
84+
--only precompiled_cutedsl_grouped_mm_tuned,tlx_grouped_gemm,triton_grouped_gemm,aten_grouped_mm
7385
int4_gemm_fwd:
7486
args: --op int4_gemm --baseline eager_int4_gemm --metrics latency,tflops,speedup
7587
--only preprocessed_triton_int4_gemm,triton_int4_gemm,eager_int4_gemm

benchmarks/tagging/ast_analyzer.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -62,6 +62,8 @@ class Edge:
6262

6363

6464
def split_by_the_last_dot(s: str) -> Optional[Tuple[str, str]]:
65+
if s == None:
66+
return None, None
6567
if "." in s:
6668
return s.rsplit(".", 1)
6769
else:

0 commit comments

Comments
 (0)