Skip to content

Commit 4384377

Browse files
authored
[https://nvbugs/5601682][fix] unwaive test_disaggregated_deepseek_v3_lite_bf16_empty_batch (#8888)
Signed-off-by: Bo Deng <[email protected]>
1 parent 0206d8d commit 4384377

File tree

3 files changed

+5
-11
lines changed

3 files changed

+5
-11
lines changed

tests/integration/defs/accuracy/test_disaggregated_serving.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -985,7 +985,7 @@ def test_chunked_prefill(self):
985985

986986

987987
@skip_pre_blackwell
988-
@pytest.mark.timeout(DEFAULT_TEST_TIMEOUT)
988+
@pytest.mark.timeout(3600)
989989
class TestQwen3_30B_A3B(LlmapiAccuracyTestHarness):
990990
FP4_MODEL = f"{llm_models_root()}/Qwen3/saved_models_Qwen3-30B-A3B_nvfp4_hf"
991991
FP8_MODEL = f"{llm_models_root()}/Qwen3/saved_models_Qwen3-30B-A3B_fp8_hf"

tests/integration/defs/disaggregated/test_disaggregated.py

Lines changed: 4 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -1289,8 +1289,7 @@ def run_disaggregated_benchmark(example_dir,
12891289
random_input_len=16,
12901290
random_output_len=64,
12911291
num_prompts=100,
1292-
max_concurrency=32,
1293-
skip_warmup=False):
1292+
max_concurrency=32):
12941293
"""Run disaggregated test with given configuration."""
12951294
run_env = env.copy()
12961295
run_env["UCX_TLS"] = "^ib"
@@ -1320,7 +1319,7 @@ def run_disaggregated_benchmark(example_dir,
13201319
stderr=subprocess.STDOUT,
13211320
env=run_env,
13221321
cwd=cwd) as server_proc):
1323-
# Ensure the sever has started
1322+
13241323
client_dir = f"{example_dir}/clients"
13251324
client_cmd = [
13261325
'python3', f'{client_dir}/disagg_client.py', '-c',
@@ -1329,7 +1328,7 @@ def run_disaggregated_benchmark(example_dir,
13291328
'--server-start-timeout',
13301329
str(server_start_timeout)
13311330
]
1332-
# Warm up
1331+
# Ensure the server has started and workers are ready
13331332
check_call(client_cmd,
13341333
env=env,
13351334
poll_procs=[workers_proc, server_proc])
@@ -1366,9 +1365,6 @@ def run_disaggregated_benchmark(example_dir,
13661365
'--percentile-metrics',
13671366
'e2el,ttft',
13681367
]
1369-
# warm up
1370-
if not skip_warmup:
1371-
check_call(benchmark_cmd, env=env)
13721368
output = check_output(benchmark_cmd, env=env)
13731369
e2el_pattern = r"Median E2EL \(ms\):\s*(\d+\.?\d*)"
13741370
ttft_pattern = r"Median TTFT \(ms\):\s*(\d+\.?\d*)"
@@ -1513,8 +1509,7 @@ def test_disaggregated_deepseek_v3_lite_bf16_empty_batch(
15131509
num_prompts=10,
15141510
max_concurrency=10,
15151511
random_input_len=384,
1516-
random_output_len=1536,
1517-
skip_warmup=True)
1512+
random_output_len=1536)
15181513
print(f"E2EL: {e2el} ms, TTFT: {ttft} ms")
15191514

15201515
assert e2el > 0 and ttft > 0

tests/integration/test_lists/waives.txt

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -337,7 +337,6 @@ triton_server/test_triton_llm.py::test_llmapi_backend[4-0-disableDecoupleMode-te
337337
triton_server/test_triton_llm.py::test_llmapi_backend[1-0-disableDecoupleMode-tensorrt_llm] SKIP (https://nvbugs/5461874)
338338
triton_server/test_triton_llm.py::test_llmapi_backend[1-0-enableDecoupleMode-tensorrt_llm] SKIP (https://nvbugs/5461874)
339339
cpp/test_e2e.py::test_benchmarks[gpt-80] SKIP (https://nvbugs/5601670)
340-
disaggregated/test_disaggregated.py::test_disaggregated_deepseek_v3_lite_bf16_empty_batch[DeepSeek-V3-Lite-bf16] SKIP (https://nvbugs/5601682)
341340
disaggregated/test_disaggregated.py::test_disaggregated_benchmark_on_diff_backends[llama-v3-8b-hf] SKIP (https://nvbugs/5587574)
342341
full:H20-3e/accuracy/test_llm_api_pytorch.py::TestNemotronUltra::test_auto_dtype[tp8ep4-cuda_graph=True] SKIP (slow I/O)
343342
full:H20-3e/accuracy/test_llm_api_pytorch.py::TestKimiK2::test_fp8_blockscale[latency] SKIP (slow I/O)

0 commit comments

Comments
 (0)