Skip to content

Commit d47360e

Browse files
committed
update test
1 parent 5ffc2a0 commit d47360e

File tree

1 file changed

+4
-3
lines changed

1 file changed

+4
-3
lines changed

examples/server/tests/unit/test_infill.py

Lines changed: 4 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -61,10 +61,11 @@ def test_invalid_input_extra_req(input_extra):
6161
def test_with_qwen_model():
6262
global server
6363
server.model_file = None
64-
server.model_hf_repo = "Qwen/Qwen2.5-Coder-1.5B-Instruct-GGUF"
65-
server.model_hf_file = "qwen2.5-coder-1.5b-instruct-q2_k.gguf"
64+
server.model_hf_repo = "ggml-org/Qwen2.5-Coder-1.5B-IQ3_XXS-GGUF"
65+
server.model_hf_file = "qwen2.5-coder-1.5b-iq3_xxs-imat.gguf"
6666
server.start(timeout_seconds=600)
6767
res = server.make_request("POST", "/infill", data={
68+
# "prompt": "Complete this", # FIXME: add more complicated prompt when format_infill is fixed
6869
"input_extra": [{
6970
"filename": "llama.h",
7071
"text": "LLAMA_API int32_t llama_n_threads();\n"
@@ -73,4 +74,4 @@ def test_with_qwen_model():
7374
"input_suffix": "}\n",
7475
})
7576
assert res.status_code == 200
76-
assert res.body["content"].startswith("n_threads")
77+
assert res.body["content"] == "n_threads();\n printf(\"Number of threads: %d\\n\", n_threads);\n return 0;\n"

0 commit comments

Comments
 (0)