@@ -44,26 +44,30 @@ def generate_data(model_output):
4444
4545
@app.get("/inference_sft")
@app.post("/inference_sft")
async def inference_sft(tts_text: str = Form(), spk_id: str = Form()):
    """Serve ``/inference_sft`` for both GET and POST requests.

    Both parameters are read as form fields and forwarded unchanged to
    ``cosyvoice.inference_sft``.

    Args:
        tts_text: Form field passed as the first argument to the model call.
        spk_id: Form field passed as the second argument to the model call.

    Returns:
        A ``StreamingResponse`` whose body is ``generate_data`` applied to
        the model output.
    """
    return StreamingResponse(
        generate_data(cosyvoice.inference_sft(tts_text, spk_id))
    )
5051
5152
@app.get("/inference_zero_shot")
@app.post("/inference_zero_shot")
async def inference_zero_shot(
    tts_text: str = Form(),
    prompt_text: str = Form(),
    prompt_wav: UploadFile = File(),
):
    """Serve ``/inference_zero_shot`` for both GET and POST requests.

    Args:
        tts_text: Form field forwarded to ``cosyvoice.inference_zero_shot``.
        prompt_text: Form field forwarded to ``cosyvoice.inference_zero_shot``.
        prompt_wav: Uploaded file; its underlying file object is handed to
            ``load_wav``.

    Returns:
        A ``StreamingResponse`` whose body is ``generate_data`` applied to
        the model output.
    """
    # NOTE(review): 16000 is presumably the target sample rate in Hz --
    # confirm against load_wav's signature.
    prompt_audio = load_wav(prompt_wav.file, 16000)
    synthesized = cosyvoice.inference_zero_shot(tts_text, prompt_text, prompt_audio)
    body = generate_data(synthesized)
    return StreamingResponse(body)
5759
5860
@app.get("/inference_cross_lingual")
@app.post("/inference_cross_lingual")
async def inference_cross_lingual(
    tts_text: str = Form(),
    prompt_wav: UploadFile = File(),
):
    """Serve ``/inference_cross_lingual`` for both GET and POST requests.

    Args:
        tts_text: Form field forwarded to
            ``cosyvoice.inference_cross_lingual``.
        prompt_wav: Uploaded file; its underlying file object is handed to
            ``load_wav``.

    Returns:
        A ``StreamingResponse`` whose body is ``generate_data`` applied to
        the model output.
    """
    # NOTE(review): 16000 is presumably the target sample rate in Hz --
    # confirm against load_wav's signature.
    reference_audio = load_wav(prompt_wav.file, 16000)
    synthesized = cosyvoice.inference_cross_lingual(tts_text, reference_audio)
    body = generate_data(synthesized)
    return StreamingResponse(body)
6467
6568
@app.get("/inference_instruct")
@app.post("/inference_instruct")
async def inference_instruct(
    tts_text: str = Form(),
    spk_id: str = Form(),
    instruct_text: str = Form(),
):
    """Serve ``/inference_instruct`` for both GET and POST requests.

    All three parameters are read as form fields and forwarded, in order,
    to ``cosyvoice.inference_instruct``.

    Args:
        tts_text: Form field passed as the first argument to the model call.
        spk_id: Form field passed as the second argument to the model call.
        instruct_text: Form field passed as the third argument to the model
            call.

    Returns:
        A ``StreamingResponse`` whose body is ``generate_data`` applied to
        the model output.
    """
    synthesized = cosyvoice.inference_instruct(tts_text, spk_id, instruct_text)
    body = generate_data(synthesized)
    return StreamingResponse(body)
0 commit comments