|
46 | 46 |
|
47 | 47 | PARAMS_MODELS_BACKENDS_TOKENIZER_MODE = [ |
48 | 48 | ("mistralai/Ministral-8B-Instruct-2410", "xgrammar", "auto", None), |
49 | | - ("mistralai/Ministral-8B-Instruct-2410", "guidance", "auto", None), |
| 49 | + # FIXME: "auto" will use the Mistral tokenizer, which the guidance and |
| 50 | + # lm-format-enforcer backends do not support, so we skip these tests for now. |
| 51 | + # ("mistralai/Ministral-8B-Instruct-2410", "guidance", "auto", None), |
| 52 | + # ("mistralai/Ministral-8B-Instruct-2410", "lm-format-enforcer", "auto", None), |
| 53 | + ("mistralai/Ministral-8B-Instruct-2410", "guidance", "hf", None), |
50 | 54 | pytest.param( |
51 | 55 | "mistralai/Ministral-8B-Instruct-2410", |
52 | 56 | "lm-format-enforcer", |
53 | | - "auto", |
| 57 | + "hf", |
54 | 58 | None, |
55 | 59 | marks=pytest.mark.skip( |
56 | 60 | reason=( |
|
80 | 84 | # ("mistralai/Ministral-8B-Instruct-2410", "outlines", "mistral", None), |
81 | 85 | # ("Qwen/Qwen2.5-1.5B-Instruct", "guidance", "auto"), |
82 | 86 | ("mistralai/Ministral-8B-Instruct-2410", "outlines", "auto", NGRAM_SPEC_CONFIG), |
83 | | - ("mistralai/Ministral-8B-Instruct-2410", "guidance", "auto", NGRAM_SPEC_CONFIG), |
| 87 | + ("mistralai/Ministral-8B-Instruct-2410", "guidance", "hf", NGRAM_SPEC_CONFIG), |
84 | 88 | ("Qwen/Qwen2.5-1.5B-Instruct", "xgrammar", "auto", NGRAM_SPEC_CONFIG), |
85 | 89 | ("meta-llama/Meta-Llama-3.1-8B-Instruct", "xgrammar", "auto", EAGLE_SPEC_CONFIG), |
86 | 90 | ] |
@@ -151,6 +155,8 @@ def test_structured_output( |
151 | 155 | ), |
152 | 156 | seed=120, |
153 | 157 | tokenizer_mode=tokenizer_mode, |
| 158 | + load_format="auto" if not model_name.startswith("mistralai/") else "hf", |
| 159 | + config_format="auto" if not model_name.startswith("mistralai/") else "hf", |
154 | 160 | speculative_config=speculative_config, |
155 | 161 | ) |
156 | 162 |
|
@@ -720,6 +726,8 @@ def test_structured_output_auto_mode( |
720 | 726 | max_model_len=1024, |
721 | 727 | structured_outputs_config=dict(backend="auto"), |
722 | 728 | tokenizer_mode=tokenizer_mode, |
| 729 | + load_format="auto", |
| 730 | + config_format="auto", |
723 | 731 | ) |
724 | 732 |
|
725 | 733 | sampling_params = SamplingParams( |
|
0 commit comments