File tree (expand / collapse): 5 files changed, +99 -69 lines changed
lines changed Original file line number Diff line number Diff line change @@ -99,5 +99,5 @@ def get_embedding_mode(model_path: str):
99
99
if __name__ == "__main__" :
100
100
101
101
# 示例用法
102
- r = get_embedding_mode("/home/dev/model/BAAI/bge-m3/")
102
+ r = get_embedding_mode("/home/dev/model/Qwen/Qwen3-Reranker-0___6B/")
103
103
print (r )
Original file line number Diff line number Diff line change 1
1
from typing import Tuple
2
2
3
- __version__ = "0.3.7"
3
+ __version__ = "0.6.0"
4
4
short_version = __version__
5
5
6
6
Original file line number Diff line number Diff line change 1
1
[project ]
2
2
name = " gpt_server"
3
- version = "0.5.4"
3
+ version = "0.6.0"
4
4
description = " gpt_server是一个用于生产级部署LLMs或Embedding的开源框架。"
5
5
readme = " README.md"
6
6
license = { text = " Apache 2.0" }
@@ -12,7 +12,7 @@ dependencies = [
12
12
" ffmpy" ,
13
13
" fschat==0.2.36" ,
14
14
" infinity-emb[all]==0.0.76" ,
15
- "lmdeploy==0.9.1",
15
+ "lmdeploy==0.9.2",
16
16
" loguru>=0.7.2" ,
17
17
" openai==1.86.0" ,
18
18
" setuptools==75.2.0" ,
@@ -25,7 +25,7 @@ dependencies = [
25
25
" modelscope==1.26.0" ,
26
26
" edge-tts>=7.0.0" ,
27
27
" funasr>=1.2.6" ,
28
- "sglang[all]>=0.4.9.post3",
28
+ "sglang[all]>=0.4.10",
29
29
" flashinfer-python" ,
30
30
" flashtts>=0.1.7" ,
31
31
" diffusers>=0.33.1" ,
@@ -42,6 +42,7 @@ override-dependencies = [
42
42
" transformers==4.53.3" , # infinity-emb
43
43
" soundfile==0.13.1" , # infinity
44
44
" xgrammar==0.1.21" , # sglang[all]==0.4.5 depends on xgrammar==0.1.17
45
+ " flashinfer-python==0.2.10" ,
45
46
]
46
47
47
48
[project .scripts ]
You can’t perform that action at this time.
0 commit comments