2 files changed: +5 -6 lines changed
Original file line number | Diff line number | Diff line change
@@ -3316,12 +3316,10 @@ def test_eagle3(self):
3316 3316   spec_config = EagleDecodingConfig(max_draft_len=draft_len,
3317 3317                                     speculative_model_dir=eagle_model_dir)
3318 3318
3319      - llm = LLM(model=target_model_dir,
3320      -           **pytorch_config,
3321      -           kv_cache_config=kv_cache_config,
3322      -           speculative_config=spec_config)
3323      -
3324      - with llm:
     3319 + with LLM(model=target_model_dir,
     3320 +          **pytorch_config,
     3321 +          kv_cache_config=kv_cache_config,
     3322 +          speculative_config=spec_config) as llm:
3325 3323       task = GSM8K(self.MODEL_NAME)
3326 3324       task.evaluate(llm)
3327 3325
Original file line number | Diff line number | Diff line change
@@ -229,6 +229,7 @@ accuracy/test_llm_api_pytorch.py::TestQwen3_30B_A3B::test_w4a8_mxfp4[mxfp8-laten
229 229   accuracy/test_llm_api_pytorch.py::TestQwen3_8B::test_fp8_block_scales[latency]
230 230   accuracy/test_llm_api_pytorch.py::TestQwen3_8B::test_w4a8_mxfp4[fp8-latency]
231 231   accuracy/test_llm_api_pytorch.py::TestQwen3_8B::test_w4a8_mxfp4[mxfp8-latency]
    232 + accuracy/test_llm_api_pytorch.py::TestQwen3_4B::test_eagle3
232 233   accuracy/test_llm_api_pytorch.py::TestSeedOss_36B::test_auto_dtype
233 234
234 235   accuracy/test_llm_api_pytorch_multimodal.py::TestQwen2_VL_7B::test_auto_dtype
You can’t perform that action at this time.
0 commit comments