Skip to content

Commit ac404be

Browse files
committed
server : add split model test
1 parent 76b27d2 commit ac404be

File tree

1 file changed

+14
-0
lines changed

1 file changed

+14
-0
lines changed

examples/server/tests/unit/test_basic.py

Lines changed: 14 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -32,3 +32,17 @@ def test_server_models():
3232
assert res.status_code == 200
3333
assert len(res.body["data"]) == 1
3434
assert res.body["data"][0]["id"] == server.model_alias
35+
36+
def test_load_split_model():
    """Start the server on a split GGUF model and check a short completion.

    Configures the shared ``server`` with the ``ggml-org/models`` repo and
    the ``stories15M-q8_0-00001-of-00003.gguf`` file (the name suggests the
    first shard of a three-part split), starts it, and posts a 16-token
    completion request for the prompt "Hello" at temperature 0.0.

    The test passes when the response status is 200 and the generated
    content satisfies ``match_regex("(little|girl)+", ...)``.
    """
    global server
    server.model_hf_repo = "ggml-org/models"
    server.model_hf_file = "tinyllamas/split/stories15M-q8_0-00001-of-00003.gguf"
    server.model_alias = "tinyllama-split"
    server.start()

    # Request body for the /completion endpoint.
    payload = {
        "n_predict": 16,
        "prompt": "Hello",
        "temperature": 0.0,
    }
    response = server.make_request("POST", "/completion", data=payload)

    assert response.status_code == 200
    assert match_regex("(little|girl)+", response.body["content"])

0 commit comments

Comments
 (0)