Skip to content

Commit b25c91e

Browse files
committed
Add dsr1 and gpt-oss test cases
Signed-off-by: Chenfei Zhang <[email protected]>
1 parent b1dc8c0 commit b25c91e

File tree

5 files changed

+75
-4
lines changed

5 files changed

+75
-4
lines changed

jenkins/L0_Test.groovy

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -2698,6 +2698,7 @@ def launchTestJobs(pipeline, testFilter)
26982698
"DGX_B300-4_GPUs-PyTorch-Post-Merge-1": ["b300-x4", "l0_dgx_b300", 1, 1, 4],
26992699
// Perf sanity post merge test
27002700
"DGX_B200-4_GPUs-PyTorch-Perf-Sanity-Post-Merge-1": ["b200-x4", "perf_sanity_l0_dgx_b200", 1, 1, 4],
2701+
"DGX_B200-8_GPUs-PyTorch-Perf-Sanity-Post-Merge-1": ["b200-x8", "perf_sanity_l0_dgx_b200", 1, 1, 8],
27012702
"DGX_B300-4_GPUs-PyTorch-Perf-Sanity-Post-Merge-1": ["b300-x4", "perf_sanity_l0_dgx_b300", 1, 1, 4],
27022703
]
27032704
fullSet += x86SlurmTestConfigs.keySet()
@@ -2730,6 +2731,7 @@ def launchTestJobs(pipeline, testFilter)
27302731
// "GB300-PyTorch-1": ["gb300-single", "l0_gb300", 1, 1],
27312732
"GB200-4_GPUs-PyTorch-1": ["gb200-trtllm", "l0_gb200_multi_gpus", 1, 1, 4],
27322733
"GB200-4_GPUs-PyTorch-Post-Merge-1": ["gb200-trtllm", "l0_gb200_multi_gpus", 1, 1, 4],
2734+
"GB200-4_GPUs-PyTorch-Perf-Sanity-Post-Merge-1": ["gb200-trtllm", "perf_sanity_l0_gb200_multi_gpus", 1, 1, 4],
27332735
// "GB300-4_GPUs-PyTorch-Post-Merge-1": ["gb300-trtllm", "l0_gb300_multi_gpus", 1, 1, 4],
27342736
]
27352737
fullSet += SBSASlurmTestConfigs.keySet()

tests/integration/defs/perf/test_perf.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -687,7 +687,7 @@ def generate_extra_llm_api_config(self) -> str:
687687
config_lines.append(f" max_draft_len: {self.max_draft_len}")
688688
if self.speculative_model_dir:
689689
config_lines.append(
690-
f" speculative_model_dir: {speculative_model_dir}")
690+
f" speculative_model_dir: {self.speculative_model_dir}")
691691

692692
return "\n".join(config_lines)
693693

tests/integration/test_lists/test-db/perf_sanity_l0_dgx_b200.yml

Lines changed: 36 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -15,7 +15,7 @@ perf_sanity_l0_dgx_b200:
1515
backend: pytorch
1616
orchestrator: mpi
1717
tests:
18-
- perf/test_perf.py::test_perf[perf_sanity_upload-l0_dgx_b200]
18+
- perf/test_perf.py::test_perf[perf_sanity_upload-l0_dgx_b200-r1_fp4_dep4,r1_fp4_tep4,r1_fp4_v2_dep4_mtp1,r1_fp4_v2_tep4_mtp3,gpt_oss_dep4,gpt_oss_tep4]
1919

2020
- condition:
2121
ranges:
@@ -32,4 +32,38 @@ perf_sanity_l0_dgx_b200:
3232
backend: pytorch
3333
orchestrator: mpi
3434
tests:
35-
- perf/test_perf.py::test_perf[perf_sanity_upload-l0_dgx_b200]
35+
- perf/test_perf.py::test_perf[perf_sanity_upload-l0_dgx_b200-r1_fp4_dep4,r1_fp4_tep4,r1_fp4_v2_dep4_mtp1,r1_fp4_v2_tep4_mtp3,gpt_oss_dep4,gpt_oss_tep4]
36+
37+
- condition:
38+
ranges:
39+
system_gpu_count:
40+
gte: 8
41+
lte: 8
42+
wildcards:
43+
gpu:
44+
- '*b200*'
45+
linux_distribution_name: ubuntu*
46+
cpu: x86_64
47+
terms:
48+
stage: pre_merge
49+
backend: pytorch
50+
orchestrator: mpi
51+
tests:
52+
- perf/test_perf.py::test_perf[perf_sanity_upload-l0_dgx_b200-r1_fp8_dep4_mtp1,r1_fp8_tep4_mtp3]
53+
54+
- condition:
55+
ranges:
56+
system_gpu_count:
57+
gte: 8
58+
lte: 8
59+
wildcards:
60+
gpu:
61+
- '*b200*'
62+
linux_distribution_name: ubuntu*
63+
cpu: x86_64
64+
terms:
65+
stage: post_merge
66+
backend: pytorch
67+
orchestrator: mpi
68+
tests:
69+
- perf/test_perf.py::test_perf[perf_sanity_upload-l0_dgx_b200-r1_fp8_dep4_mtp1,r1_fp8_tep4_mtp3]
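
tests/integration/test_lists/test-db/perf_sanity_l0_gb200_multi_gpus.yml (new file; the path header is missing from this capture and is inferred from the top-level key below and the sibling test-db list above)

Lines changed: 35 additions & 0 deletions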
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,35 @@
1+
version: 0.0.1
2+
perf_sanity_l0_gb200_multi_gpus:
3+
- condition:
4+
ranges:
5+
system_gpu_count:
6+
gte: 4
7+
lte: 4
8+
wildcards:
9+
gpu:
10+
- '*gb200*'
11+
linux_distribution_name: ubuntu*
12+
cpu: aarch64
13+
terms:
14+
stage: pre_merge
15+
backend: pytorch
16+
orchestrator: mpi
17+
tests:
18+
- perf/test_perf.py::test_perf[perf_sanity_upload-l0_gb200_multi_gpus]
19+
20+
- condition:
21+
ranges:
22+
system_gpu_count:
23+
gte: 4
24+
lte: 4
25+
wildcards:
26+
gpu:
27+
- '*gb200*'
28+
linux_distribution_name: ubuntu*
29+
cpu: aarch64
30+
terms:
31+
stage: post_merge
32+
backend: pytorch
33+
orchestrator: mpi
34+
tests:
35+
- perf/test_perf.py::test_perf[perf_sanity_upload-l0_gb200_multi_gpus]

tests/scripts/perf-sanity/l0_dgx_gb200.yaml renamed to tests/scripts/perf-sanity/l0_gb200_multi_gpus.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -32,7 +32,7 @@ server_configs:
3232
- name: "r1_fp4_v2_tep4_mtp3"
3333
model_name: "deepseek_r1_0528_fp4_v2"
3434
gpus: 4
35-
tp: 4W
35+
tp: 4
3636
ep: 1
3737
pp: 1
3838
attention_backend: "TRTLLM"

0 commit comments

Comments
 (0)