Skip to content

Commit 3299041

Browse files
committed
版本v0.4.7
1 parent 6782f6c commit 3299041

File tree

5 files changed

+489
-404
lines changed

5 files changed

+489
-404
lines changed

gpt_server/model_backend/vllm_backend.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -21,7 +21,7 @@
2121

2222
ray.init(ignore_reinit_error=True, num_cpus=4)
2323

24-
os.environ["VLLM_USE_V1"] = "0"
24+
os.environ["VLLM_USE_V1"] = "1"
2525

2626

2727
class VllmBackend(ModelBackend):
@@ -100,6 +100,7 @@ async def stream_chat(self, params: Dict[str, Any]) -> AsyncGenerator:
100100
chat_template=tokenizer.get_chat_template(),
101101
add_generation_prompt=True,
102102
tools=tools,
103+
model_config=await self.engine.get_model_config(),
103104
)
104105
mm_data = await mm_data_future
105106
inputs = {"multi_modal_data": mm_data, "prompt": prompt}

gpt_server/model_worker/spark_tts.py

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -11,7 +11,7 @@
1111
root_dir = os.path.dirname(os.path.dirname(os.path.dirname(__file__)))
1212

1313

14-
os.environ["VLLM_USE_V1"] = "0"
14+
os.environ["VLLM_USE_V1"] = "1"
1515
import httpx
1616
from fastapi import HTTPException
1717
import base64
@@ -91,6 +91,7 @@ def __init__(
9191
)
9292
)
9393
logger.warning(f"模型:{model_names[0]}")
94+
logger.info(f"list_speakers: {self.engine.list_speakers()}")
9495

9596
# 这个是模型主要的方法
9697
async def generate_voice_stream(self, params):
@@ -109,7 +110,7 @@ async def stream_async(self, params):
109110
format=response_format, sample_rate=self.engine.SAMPLE_RATE
110111
)
111112
generator = None
112-
if voice in self.engine.list_roles():
113+
if voice in self.engine.list_speakers():
113114
generator = self.engine.speak_stream_async(
114115
name=voice,
115116
text=text,

pyproject.toml

Lines changed: 8 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
[project]
22
name = "gpt_server"
3-
version = "0.4.6"
3+
version = "0.4.7"
44
description = "gpt_server是一个用于生产级部署LLMs或Embedding的开源框架。"
55
readme = "README.md"
66
license = { text = "Apache 2.0" }
@@ -19,28 +19,28 @@ dependencies = [
1919
"streamlit==1.39.0",
2020
"torch==2.6.0",
2121
"torchvision==0.20.1",
22-
"vllm==0.8.5.post1",
22+
"vllm==0.9.0.1",
2323
"qwen_vl_utils",
24-
"evalscope[perf]==0.10.1",
24+
"evalscope[perf]==0.16.1",
2525
"modelscope==1.20.1",
2626
"edge-tts>=7.0.0",
2727
"funasr>=1.2.6",
28-
"sglang[all]>=0.4.6.post2",
28+
"sglang[all]>=0.4.6.post5",
2929
"flashinfer-python",
30-
"flashtts>=0.1.5",
30+
"flashtts>=0.1.7",
3131
]
3232

3333
[tool.uv]
3434
default-groups = [] # 默认只安装dependencies中的库
3535
override-dependencies = [
3636
"setuptools==75.2.0",
37-
"torchvision==0.21.0",
38-
"torch==2.6.0",
37+
"torchvision==0.22.0",
38+
"torch==2.7.0",
3939
"triton",
4040
"outlines==0.1.11",
4141
"transformers==4.51.3", # infinity-emb
4242
"soundfile==0.13.1", # infinity
43-
"xgrammar==0.1.18", # sglang[all]==0.4.5 depends on xgrammar==0.1.17
43+
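"xgrammar==0.1.19", # pinned for sglang[all]; NOTE(review): the earlier note "sglang[all]==0.4.5 depends on xgrammar==0.1.17" is stale relative to this pin and to sglang[all]>=0.4.6.post5 — confirm the current requirement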
4444
]
4545

4646
[project.scripts]

0 commit comments

Comments
 (0)