Skip to content

Commit 54dc15e

Browse files
committed
fix qwen graph
Signed-off-by: taoyuxiang <[email protected]>
1 parent 0ea12cb commit 54dc15e

File tree

1 file changed

+10
-5
lines changed

1 file changed

+10
-5
lines changed

tests/e2e/multicard/test_torchair_graph_mode.py

Lines changed: 10 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -166,8 +166,13 @@ def test_e2e_pangu_with_torchair():
166166

167167
def _qwen_torchair_test_fixture(
168168
model,
169+
tp,
169170
enable_expert_parallel,
170171
):
172+
# The current access control does not support 16 cards,
173+
# so the MC2 operator in Qwen's graph mode cannot run.
174+
# Once 16-card support is available,
175+
# this e2e can be switched to graph mode.
171176
example_prompts = [
172177
"Hello, my name is",
173178
"The president of the United States is",
@@ -177,7 +182,7 @@ def _qwen_torchair_test_fixture(
177182

178183
additional_config = {
179184
"torchair_graph_config": {
180-
"enabled": True,
185+
"enabled": False,
181186
},
182187
"ascend_scheduler_config": {
183188
"enabled": True,
@@ -188,9 +193,9 @@ def _qwen_torchair_test_fixture(
188193
with VllmRunner(
189194
model,
190195
dtype="half",
191-
tensor_parallel_size=2,
196+
tensor_parallel_size=tp,
192197
distributed_executor_backend="mp",
193-
enforce_eager=False,
198+
enforce_eager=True,
194199
additional_config=additional_config,
195200
enable_expert_parallel=enable_expert_parallel,
196201
) as vllm_model:
@@ -214,8 +219,8 @@ def _qwen_torchair_test_fixture(
214219

215220

216221
def test_e2e_qwen2_with_torchair():
217-
_qwen_torchair_test_fixture("Qwen/Qwen2.5-0.5B-Instruct", False)
222+
_qwen_torchair_test_fixture("Qwen/Qwen2.5-32B-Instruct", 2, False)
218223

219224

220225
def test_e2e_qwen3_moe_with_torchair():
221-
_qwen_torchair_test_fixture("Qwen/Qwen3-30B-A3B", True)
226+
_qwen_torchair_test_fixture("Qwen/Qwen3-30B-A3B", 2, True)

0 commit comments

Comments
 (0)