Skip to content

Commit e1d4a47

Browse files
authored
Fix missing media_type in proxy server streaming responses (#4130)
1 parent 3ea97b1 commit e1d4a47

File tree

1 file changed

+4
-4
lines changed

1 file changed

+4
-4
lines changed

lmdeploy/serve/proxy/proxy.py

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -587,7 +587,7 @@ async def chat_completions_v1(request: ChatCompletionRequest, raw_request: Reque
587587
if request.stream is True:
588588
response = node_manager.stream_generate(request_dict, node_url, '/v1/chat/completions')
589589
background_task = node_manager.create_background_tasks(node_url, start)
590-
return StreamingResponse(response, background=background_task)
590+
return StreamingResponse(response, background=background_task, media_type='text/event-stream')
591591
else:
592592
response = await node_manager.generate(request_dict, node_url, '/v1/chat/completions')
593593
node_manager.post_call(node_url, start)
@@ -649,7 +649,7 @@ async def chat_completions_v1(request: ChatCompletionRequest, raw_request: Reque
649649
if request.stream is True:
650650
response = node_manager.stream_generate(request_dict, d_url, '/v1/chat/completions')
651651
background_task = node_manager.create_background_tasks(d_url, start)
652-
resp = StreamingResponse(response, background=background_task)
652+
resp = StreamingResponse(response, background=background_task, media_type='text/event-stream')
653653
else:
654654
response = await node_manager.generate(request_dict, d_url, '/v1/chat/completions')
655655
node_manager.post_call(d_url, start)
@@ -717,7 +717,7 @@ async def completions_v1(request: CompletionRequest, raw_request: Request = None
717717
if request.stream is True:
718718
response = node_manager.stream_generate(request_dict, node_url, '/v1/completions')
719719
background_task = node_manager.create_background_tasks(node_url, start)
720-
return StreamingResponse(response, background=background_task)
720+
return StreamingResponse(response, background=background_task, media_type='text/event-stream')
721721
else:
722722
response = await node_manager.generate(request_dict, node_url, '/v1/completions')
723723
node_manager.post_call(node_url, start)
@@ -793,7 +793,7 @@ async def completions_v1(request: CompletionRequest, raw_request: Request = None
793793
if request.stream is True:
794794
response = node_manager.stream_generate(request_dict, d_url, '/v1/completions')
795795
background_task = node_manager.create_background_tasks(d_url, start)
796-
resp = StreamingResponse(response, background=background_task)
796+
resp = StreamingResponse(response, background=background_task, media_type='text/event-stream')
797797
else:
798798
response = await node_manager.generate(request_dict, d_url, '/v1/completions')
799799
node_manager.post_call(d_url, start)

0 commit comments

Comments
 (0)