Skip to content

Commit 861a4a5

Browse files
committed
fix embedding_vllm
1 parent 9d2fec4 commit 861a4a5

File tree

1 file changed

+1
-3
lines changed

1 file changed

+1
-3
lines changed

gpt_server/model_worker/embedding_vllm.py

Lines changed: 1 addition & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -67,14 +67,12 @@ async def get_embeddings(self, params):
6767
ret = {"embedding": [], "token_num": 0}
6868
texts: list = params["input"]
6969
if self.mode == "embedding":
70-
usage = None
7170
texts = list(map(lambda x: x.replace("\n", " "), texts))
7271
# ----------
73-
outputs = self.engine.embed(prompts=texts)
72+
outputs = self.engine.embed(texts)
7473
embedding = [o.outputs.embedding for o in outputs]
7574

7675
ret["embedding"] = embedding
77-
ret["token_num"] = usage
7876
return ret
7977

8078

0 commit comments

Comments
 (0)