Skip to content

Commit be54f8e

Browse files
authored
[Fix] Change /generate response-type to json for non-streaming (#374)
1 parent b396cb4 commit be54f8e

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

vllm/entrypoints/api_server.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -3,7 +3,7 @@
3 3
from typing import AsyncGenerator
4 4

5 5
from fastapi import BackgroundTasks, FastAPI, Request
6 -
from fastapi.responses import Response, StreamingResponse
6 +
from fastapi.responses import JSONResponse, Response, StreamingResponse
7 7
import uvicorn
8 8

9 9
from vllm.engine.arg_utils import AsyncEngineArgs
@@ -64,7 +64,7 @@ async def abort_request() -> None:
64 64
prompt = final_output.prompt
65 65
text_outputs = [prompt + output.text for output in final_output.outputs]
66 66
ret = {"text": text_outputs}
67 -
return Response(content=json.dumps(ret))
67 +
return JSONResponse(ret)
68 68

69 69

70 70
if __name__ == "__main__":

0 commit comments

Comments
 (0)