Skip to content

Commit 5ff244c

Browse files
authored
[https://nvbugs/5837281][fix] Fix trtllm-serve guided decoding test (#11101)
Signed-off-by: Enwei Zhu <21126786+syuoni@users.noreply.github.com>
1 parent 9959a5c commit 5ff244c

File tree

3 files changed, with 9 additions and 3 deletions (+9 -3 lines changed).

tests/integration/defs/test_e2e.py

Lines changed: 4 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1736,8 +1736,10 @@ def test_openai_mmencoder_example(llm_root, llm_venv):
1736 1736   str(test_root / "_test_openai_mmencoder.py")])
1737 1737
1738 1738
1739      - @pytest.mark.parametrize(
1740      - "model_name", ["meta-llama/Llama-3.1-8B-Instruct", "openai/gpt-oss-120b"])
     1739 + @pytest.mark.parametrize("model_name", [
     1740 + "meta-llama/Llama-3.1-8B-Instruct",
     1741 + pytest.param("openai/gpt-oss-120b", marks=skip_pre_hopper)
     1742 + ])
1741 1743   def test_openai_chat_guided_decoding(llm_root, llm_venv, model_name: str):
1742 1744   test_root = unittest_path() / "llmapi" / "apps"
1743 1745   llm_venv.run_cmd([

tests/integration/test_lists/waives.txt

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -344,7 +344,6 @@ examples/test_llama.py::test_llama_3_x_with_bf16_lora_torch[llama-3.2-1b-instruc
344 344   accuracy/test_llm_api_autodeploy.py::TestNemotronSuperV3::test_bf16 SKIP (https://nvbugs/5838184)
345 345   cpp/test_multi_gpu.py::test_cache_transceiver[8proc-mooncake_kvcache-90] SKIP (https://nvbugs/5838199)
346 346   accuracy/test_llm_api_pytorch.py::TestGPTOSS::test_w4_4gpus[dp4-cutlass-auto] SKIP (https://nvbugs/5838211)
347     - test_e2e.py::test_openai_chat_guided_decoding[openai/gpt-oss-120b] SKIP (https://nvbugs/5836594)
348 347   test_e2e.py::test_ptp_quickstart_advanced_ngram[Llama-3.1-8B-Instruct-llama-3.1-model/Llama-3.1-8B-Instruct] SKIP (https://nvbugs/5843112)
349 348   accuracy/test_llm_api_pytorch.py::TestDeepSeekR1::test_fp8_blockscale[throughput_mtp] SKIP (https://nvbugs/5839028)
350 349   unittest/kv_cache_manager_v2_tests/test_kv_cache_manager_v2.py::TestNoBatching::test_naive_0 SKIP (https://nvbugs/5841954)

tests/unittest/llmapi/apps/_test_openai_chat_guided_decoding.py

Lines changed: 5 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -9,11 +9,16 @@
 9  9   import openai
10 10   import pytest
11 11   import yaml
   12 + from utils.llm_data import llm_datasets_root
12 13
13 14   from ..test_llm import get_model_path
14 15   from .openai_server import RemoteOpenAIServer
15 16
16 17   pytestmark = pytest.mark.threadleak(enabled=False)
   18 + os.environ['TIKTOKEN_RS_CACHE_DIR'] = os.path.join(llm_datasets_root(),
   19 + 'tiktoken_vocab')
   20 + os.environ['TIKTOKEN_ENCODINGS_BASE'] = os.path.join(llm_datasets_root(),
   21 + 'tiktoken_vocab')
17 22
18 23
19 24   @pytest.fixture(

0 commit comments

Comments
 (0)