File tree Expand file tree Collapse file tree 4 files changed +313
-430
lines changed Expand file tree Collapse file tree 4 files changed +313
-430
lines changed Original file line number Diff line number Diff line change @@ -48,9 +48,10 @@ def __init__(
48
48
device = "cuda"
49
49
logger .warning (f"使用{ device } 加载..." )
50
50
model_type = getattr (self .model_config , "model_type" , None )
51
- bettertransformer = True
52
- if model_type is not None and "deberta" in model_type :
53
- bettertransformer = False
51
+ bettertransformer = False
52
+ # TODO: bettertransformer = True currently causes problems with transformers; keep it disabled until that is resolved
53
+ # if model_type is not None and "deberta" in model_type:
54
+ # bettertransformer = False
54
55
engine_args = EngineArgs (
55
56
model_name_or_path = model_path ,
56
57
engine = "torch" ,
Original file line number Diff line number Diff line change 1
1
[project ]
2
2
name = " gpt_server"
3
- version = " 0.5.3 "
3
+ version = " 0.5.4 "
4
4
description = " gpt_server是一个用于生产级部署LLMs或Embedding的开源框架。"
5
5
readme = " README.md"
6
6
license = { text = " Apache 2.0" }
@@ -12,20 +12,20 @@ dependencies = [
12
12
" ffmpy" ,
13
13
" fschat==0.2.36" ,
14
14
" infinity-emb[all]==0.0.76" ,
15
- " lmdeploy==0.9.0 " ,
15
+ " lmdeploy==0.9.1 " ,
16
16
" loguru>=0.7.2" ,
17
17
" openai==1.86.0" ,
18
18
" setuptools==75.2.0" ,
19
19
" streamlit==1.39.0" ,
20
20
" torch==2.6.0" ,
21
21
" torchvision==0.20.1" ,
22
- " vllm==0.9.1 " ,
22
+ " vllm==0.9.2 " ,
23
23
" qwen_vl_utils" ,
24
24
" evalscope[perf,rag]==0.16.1" ,
25
25
" modelscope==1.26.0" ,
26
26
" edge-tts>=7.0.0" ,
27
27
" funasr>=1.2.6" ,
28
- " sglang[all]>=0.4.8.post1 " ,
28
+ " sglang[all]>=0.4.9.post3 " ,
29
29
" flashinfer-python" ,
30
30
" flashtts>=0.1.7" ,
31
31
" diffusers>=0.33.1" ,
@@ -39,10 +39,9 @@ override-dependencies = [
39
39
" torchaudio==2.7.1" ,
40
40
" torch==2.7.0" ,
41
41
" triton" ,
42
- " outlines==0.1.11" ,
43
- " transformers==4.51.3" , # infinity-emb
42
+ " transformers==4.53.3" , # infinity-emb
44
43
" soundfile==0.13.1" , # infinity
45
- " xgrammar==0.1.19 " , # sglang[all]==0.4.5 depends on xgrammar==0.1.17
44
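+ " xgrammar==0.1.21 " , # pinned for sglang[all]; NOTE(review): the previous note cited sglang[all]==0.4.5 / xgrammar==0.1.17 and is stale — confirm against the current sglang requirement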
46
45
]
47
46
48
47
[project .scripts ]
You can’t perform that action at this time.
0 commit comments