We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 76b27d2, commit ac404be (Copy full SHA for ac404be)
examples/server/tests/unit/test_basic.py
@@ -32,3 +32,17 @@ def test_server_models():
32
assert res.status_code == 200
33
assert len(res.body["data"]) == 1
34
assert res.body["data"][0]["id"] == server.model_alias
35
+
36
def test_load_split_model():
    """Start the server on a split GGUF model and request a short completion.

    The shared ``server`` object is pointed at the first shard
    (``-00001-of-00003``) of a model in the ``ggml-org/models`` repo, then
    started. A 16-token completion for the prompt "Hello" must return
    HTTP 200 and content that matches the expected pattern.
    """
    # `server` is the module-level instance also used by the other tests here.
    global server

    # Select the split model; only the first shard's file name is given.
    server.model_hf_repo = "ggml-org/models"
    server.model_hf_file = "tinyllamas/split/stories15M-q8_0-00001-of-00003.gguf"
    server.model_alias = "tinyllama-split"
    server.start()

    completion_request = {
        "n_predict": 16,
        "prompt": "Hello",
        # NOTE(review): presumably 0.0 is used to keep the output stable
        # between runs -- confirm against the server's sampling docs.
        "temperature": 0.0,
    }
    response = server.make_request("POST", "/completion", data=completion_request)

    assert response.status_code == 200
    assert match_regex("(little|girl)+", response.body["content"])
0 commit comments