@@ -72,6 +72,14 @@ async def inference_instruct(tts_text: str = Form(), spk_id: str = Form(), instr
7272 model_output = cosyvoice .inference_instruct (tts_text , spk_id , instruct_text )
7373 return StreamingResponse (generate_data (model_output ))
7474
# Endpoint registered for both GET and POST at /inference_instruct2.
#
# Inputs (all read from the multipart form body):
#   tts_text      - forwarded as the first argument to
#                   cosyvoice.inference_instruct2 (presumably the text to
#                   synthesize; confirm against the model API).
#   instruct_text - forwarded as the second argument (presumably the
#                   instruction/style prompt; confirm against the model API).
#   prompt_wav    - uploaded file; its underlying file object is passed to
#                   load_wav and the result becomes the third model argument.
#
# Returns a StreamingResponse built from generate_data(<model output>).
@app.get("/inference_instruct2")
@app.post("/inference_instruct2")
async def inference_instruct2(
    tts_text: str = Form(),
    instruct_text: str = Form(),
    prompt_wav: UploadFile = File(),
):
    # NOTE(review): 16000 is handed to load_wav alongside the upload's file
    # object; it looks like a target sample rate in Hz - confirm in load_wav.
    prompt_audio = load_wav(prompt_wav.file, 16000)
    return StreamingResponse(
        generate_data(
            cosyvoice.inference_instruct2(tts_text, instruct_text, prompt_audio)
        )
    )
81+
82+
7583
7684if __name__ == '__main__' :
7785 parser = argparse .ArgumentParser ()
@@ -80,14 +88,14 @@ async def inference_instruct(tts_text: str = Form(), spk_id: str = Form(), instr
8088 default = 50000 )
8189 parser .add_argument ('--model_dir' ,
8290 type = str ,
83- default = 'iic/CosyVoice-300M ' ,
91+ default = 'pretrained_models/CosyVoice2-0.5B ' ,
8492 help = 'local path or modelscope repo id' )
8593 args = parser .parse_args ()
8694 try :
8795 cosyvoice = CosyVoice (args .model_dir )
8896 except Exception :
8997 try :
90- cosyvoice = CosyVoice2 (args .model_dir )
98+ cosyvoice = CosyVoice2 (args .model_dir , load_jit = True , load_trt = False )
9199 except Exception :
92100 raise TypeError ('no valid model_type!' )
93- uvicorn .run (app , host = "0.0.0.0" , port = args .port )
101+ uvicorn .run (app , host = "0.0.0.0" , port = args .port )
0 commit comments