@@ -587,7 +587,7 @@ async def chat_completions_v1(request: ChatCompletionRequest, raw_request: Reque
587587 if request .stream is True :
588588 response = node_manager .stream_generate (request_dict , node_url , '/v1/chat/completions' )
589589 background_task = node_manager .create_background_tasks (node_url , start )
590- return StreamingResponse (response , background = background_task )
590+ return StreamingResponse (response , background = background_task , media_type = 'text/event-stream' )
591591 else :
592592 response = await node_manager .generate (request_dict , node_url , '/v1/chat/completions' )
593593 node_manager .post_call (node_url , start )
@@ -649,7 +649,7 @@ async def chat_completions_v1(request: ChatCompletionRequest, raw_request: Reque
649649 if request .stream is True :
650650 response = node_manager .stream_generate (request_dict , d_url , '/v1/chat/completions' )
651651 background_task = node_manager .create_background_tasks (d_url , start )
652- resp = StreamingResponse (response , background = background_task )
652+ resp = StreamingResponse (response , background = background_task , media_type = 'text/event-stream' )
653653 else :
654654 response = await node_manager .generate (request_dict , d_url , '/v1/chat/completions' )
655655 node_manager .post_call (d_url , start )
@@ -717,7 +717,7 @@ async def completions_v1(request: CompletionRequest, raw_request: Request = None
717717 if request .stream is True :
718718 response = node_manager .stream_generate (request_dict , node_url , '/v1/completions' )
719719 background_task = node_manager .create_background_tasks (node_url , start )
720- return StreamingResponse (response , background = background_task )
720+ return StreamingResponse (response , background = background_task , media_type = 'text/event-stream' )
721721 else :
722722 response = await node_manager .generate (request_dict , node_url , '/v1/completions' )
723723 node_manager .post_call (node_url , start )
@@ -793,7 +793,7 @@ async def completions_v1(request: CompletionRequest, raw_request: Request = None
793793 if request .stream is True :
794794 response = node_manager .stream_generate (request_dict , d_url , '/v1/completions' )
795795 background_task = node_manager .create_background_tasks (d_url , start )
796- resp = StreamingResponse (response , background = background_task )
796+ resp = StreamingResponse (response , background = background_task , media_type = 'text/event-stream' )
797797 else :
798798 response = await node_manager .generate (request_dict , d_url , '/v1/completions' )
799799 node_manager .post_call (d_url , start )
0 commit comments