@@ -230,6 +230,7 @@ def setup(
230
230
enkws = True ,
231
231
max_token_len = 127 ,
232
232
request_id = "llm_setup" ,
233
+ ** kwargs ,
233
234
) -> str :
234
235
cmd = {
235
236
"request_id" : request_id ,
@@ -246,6 +247,7 @@ def setup(
246
247
"prompt" : prompt ,
247
248
},
248
249
}
250
+ cmd ["data" ].update (kwargs )
249
251
success = self ._module_msg .send_cmd_and_wait_to_take_msg (
250
252
ujson .dumps (cmd ), request_id , self ._set_llm_work_id , 30000
251
253
)
@@ -321,6 +323,7 @@ def setup(
321
323
enoutput = True ,
322
324
max_token_len = 256 ,
323
325
request_id = "vlm_setup" ,
326
+ ** kwargs ,
324
327
) -> str :
325
328
cmd = {
326
329
"request_id" : request_id ,
@@ -336,6 +339,7 @@ def setup(
336
339
"prompt" : prompt ,
337
340
},
338
341
}
342
+ cmd ["data" ].update (kwargs )
339
343
success = self ._module_msg .send_cmd_and_wait_to_take_msg (
340
344
ujson .dumps (cmd ), request_id , self ._set_llm_work_id , 30000
341
345
)
@@ -420,6 +424,7 @@ def setup(
420
424
playdevice = 1 ,
421
425
play_volume = 0.15 ,
422
426
request_id = "audio_setup" ,
427
+ ** kwargs ,
423
428
) -> str :
424
429
cmd = {
425
430
"request_id" : request_id ,
@@ -435,7 +440,7 @@ def setup(
435
440
"playVolume" : play_volume ,
436
441
},
437
442
}
438
-
443
+ cmd [ "data" ]. update ( kwargs )
439
444
success = self ._module_msg .send_cmd_and_wait_to_take_msg (
440
445
ujson .dumps (cmd ), request_id , self ._set_audio_work_id , 5000
441
446
)
@@ -468,6 +473,7 @@ def setup(
468
473
enoutput = False ,
469
474
response_format = "camera.raw" ,
470
475
request_id = "camera_setup" ,
476
+ ** kwargs ,
471
477
) -> str :
472
478
cmd = {
473
479
"request_id" : request_id ,
@@ -482,7 +488,7 @@ def setup(
482
488
"enoutput" : enoutput ,
483
489
},
484
490
}
485
-
491
+ cmd [ "data" ]. update ( kwargs )
486
492
success = self ._module_msg .send_cmd_and_wait_to_take_msg (
487
493
ujson .dumps (cmd ), request_id , self ._set_camera_work_id , 10000
488
494
)
@@ -517,6 +523,7 @@ def setup(
517
523
enoutput = False ,
518
524
enkws = False ,
519
525
request_id = "tts_setup" ,
526
+ ** kwargs ,
520
527
) -> str :
521
528
cmd = {
522
529
"request_id" : request_id ,
@@ -531,7 +538,7 @@ def setup(
531
538
"enkws" : enkws ,
532
539
},
533
540
}
534
-
541
+ cmd [ "data" ]. update ( kwargs )
535
542
success = self ._module_msg .send_cmd_and_wait_to_take_msg (
536
543
ujson .dumps (cmd ), request_id , self ._set_llm_work_id , 10000
537
544
)
@@ -588,6 +595,7 @@ def setup(
588
595
input = "tts.utf-8.stream" ,
589
596
enoutput = False ,
590
597
request_id = "melotts_setup" ,
598
+ ** kwargs ,
591
599
) -> str :
592
600
cmd = {
593
601
"request_id" : request_id ,
@@ -601,7 +609,7 @@ def setup(
601
609
"enoutput" : enoutput ,
602
610
},
603
611
}
604
-
612
+ cmd [ "data" ]. update ( kwargs )
605
613
success = self ._module_msg .send_cmd_and_wait_to_take_msg (
606
614
ujson .dumps (cmd ), request_id , self ._set_llm_work_id , 30000
607
615
)
@@ -658,6 +666,7 @@ def setup(
658
666
enoutput = True ,
659
667
enaudio = True ,
660
668
request_id = "kws_setup" ,
669
+ ** kwargs ,
661
670
) -> str :
662
671
cmd = {
663
672
"request_id" : request_id ,
@@ -673,7 +682,7 @@ def setup(
673
682
"kws" : kws ,
674
683
},
675
684
}
676
-
685
+ cmd [ "data" ]. update ( kwargs )
677
686
success = self ._module_msg .send_cmd_and_wait_to_take_msg (
678
687
ujson .dumps (cmd ), request_id , self ._set_llm_work_id , 30000
679
688
)
@@ -708,6 +717,7 @@ def setup(
708
717
rule2 = 1.2 ,
709
718
rule3 = 30.0 ,
710
719
request_id = "asr_setup" ,
720
+ ** kwargs ,
711
721
) -> str :
712
722
cmd = {
713
723
"request_id" : request_id ,
@@ -725,7 +735,7 @@ def setup(
725
735
"rule3" : rule3 ,
726
736
},
727
737
}
728
-
738
+ cmd [ "data" ]. update ( kwargs )
729
739
success = self ._module_msg .send_cmd_and_wait_to_take_msg (
730
740
ujson .dumps (cmd ), request_id , self ._set_llm_work_id , 10000
731
741
)
@@ -756,6 +766,7 @@ def setup(
756
766
input = "sys.pcm" ,
757
767
enoutput = True ,
758
768
request_id = "vad_setup" ,
769
+ ** kwargs ,
759
770
) -> str :
760
771
cmd = {
761
772
"request_id" : request_id ,
@@ -769,7 +780,7 @@ def setup(
769
780
"enoutput" : enoutput ,
770
781
},
771
782
}
772
-
783
+ cmd [ "data" ]. update ( kwargs )
773
784
success = self ._module_msg .send_cmd_and_wait_to_take_msg (
774
785
ujson .dumps (cmd ), request_id , self ._set_llm_work_id , 30000
775
786
)
@@ -801,6 +812,7 @@ def setup(
801
812
enoutput = True ,
802
813
language = "en" ,
803
814
request_id = "whisper_setup" ,
815
+ ** kwargs ,
804
816
) -> str :
805
817
cmd = {
806
818
"request_id" : request_id ,
@@ -815,7 +827,7 @@ def setup(
815
827
"enoutput" : enoutput ,
816
828
},
817
829
}
818
-
830
+ cmd [ "data" ]. update ( kwargs )
819
831
success = self ._module_msg .send_cmd_and_wait_to_take_msg (
820
832
ujson .dumps (cmd ), request_id , self ._set_llm_work_id , 30000
821
833
)
@@ -847,6 +859,7 @@ def setup(
847
859
input = "yolo.jpg.base64" ,
848
860
enoutput = True ,
849
861
request_id = "yolo_setup" ,
862
+ ** kwargs ,
850
863
) -> str :
851
864
cmd = {
852
865
"request_id" : request_id ,
@@ -860,7 +873,7 @@ def setup(
860
873
"enoutput" : enoutput ,
861
874
},
862
875
}
863
-
876
+ cmd [ "data" ]. update ( kwargs )
864
877
success = self ._module_msg .send_cmd_and_wait_to_take_msg (
865
878
ujson .dumps (cmd ), request_id , self ._set_yolo_work_id , 10000
866
879
)
@@ -1030,6 +1043,7 @@ def llm_setup(
1030
1043
enkws = None ,
1031
1044
max_token_len = 127 ,
1032
1045
request_id = "llm_setup" ,
1046
+ ** kwargs ,
1033
1047
) -> str :
1034
1048
if self .version == "v1.0" :
1035
1049
model = "qwen2.5-0.5b"
@@ -1048,7 +1062,15 @@ def llm_setup(
1048
1062
enkws = bool (enkws )
1049
1063
1050
1064
self .latest_llm_work_id = self .llm .setup (
1051
- prompt , model , response_format , input , enoutput , enkws , max_token_len , request_id
1065
+ prompt ,
1066
+ model ,
1067
+ response_format ,
1068
+ input ,
1069
+ enoutput ,
1070
+ enkws ,
1071
+ max_token_len ,
1072
+ request_id ,
1073
+ ** kwargs ,
1052
1074
)
1053
1075
return self .latest_llm_work_id
1054
1076
@@ -1066,6 +1088,7 @@ def vlm_setup(
1066
1088
enkws = None ,
1067
1089
max_token_len = 256 ,
1068
1090
request_id = "vlm_setup" ,
1091
+ ** kwargs ,
1069
1092
) -> str :
1070
1093
if input is None :
1071
1094
input = ["vlm.utf-8" ]
@@ -1076,7 +1099,7 @@ def vlm_setup(
1076
1099
input .append (enkws )
1077
1100
1078
1101
self .latest_vlm_work_id = self .vlm .setup (
1079
- prompt , model , response_format , input , enoutput , max_token_len , request_id
1102
+ prompt , model , response_format , input , enoutput , max_token_len , request_id , ** kwargs
1080
1103
)
1081
1104
return self .latest_vlm_work_id
1082
1105
@@ -1098,9 +1121,10 @@ def audio_setup(
1098
1121
playdevice = 1 ,
1099
1122
play_volume = 0.15 ,
1100
1123
request_id = "audio_setup" ,
1124
+ ** kwargs ,
1101
1125
) -> str :
1102
1126
self .latest_audio_work_id = self .audio .setup (
1103
- capcard , capdevice , cap_volume , playcard , playdevice , play_volume , request_id
1127
+ capcard , capdevice , cap_volume , playcard , playdevice , play_volume , request_id , ** kwargs
1104
1128
)
1105
1129
return self .latest_audio_work_id
1106
1130
@@ -1112,9 +1136,10 @@ def camera_setup(
1112
1136
frame_height = 320 ,
1113
1137
enoutput = False ,
1114
1138
response_format = "camera.raw" ,
1139
+ ** kwargs ,
1115
1140
) -> str :
1116
1141
self .latest_camera_work_id = self .camera .setup (
1117
- input , frame_width , frame_height , enoutput , response_format , request_id
1142
+ input , frame_width , frame_height , enoutput , response_format , request_id , ** kwargs
1118
1143
)
1119
1144
return self .latest_camera_work_id
1120
1145
@@ -1145,6 +1170,7 @@ def tts_setup(
1145
1170
enoutput = False ,
1146
1171
enkws = None ,
1147
1172
request_id = "tts_setup" ,
1173
+ ** kwargs ,
1148
1174
) -> str :
1149
1175
if self .version == "v1.0" :
1150
1176
response_format = "tts.base64.wav"
@@ -1165,7 +1191,7 @@ def tts_setup(
1165
1191
enkws = bool (enkws )
1166
1192
1167
1193
self .latest_tts_work_id = self .tts .setup (
1168
- model , response_format , input , enoutput , enkws , request_id
1194
+ model , response_format , input , enoutput , enkws , request_id , ** kwargs
1169
1195
)
1170
1196
return self .latest_tts_work_id
1171
1197
@@ -1182,6 +1208,7 @@ def melotts_setup(
1182
1208
enoutput = False ,
1183
1209
enkws = None ,
1184
1210
request_id = "melotts_setup" ,
1211
+ ** kwargs ,
1185
1212
) -> str :
1186
1213
if float (self .version .lstrip ("v" )) >= 1.6 and model == "melotts_zh-cn" :
1187
1214
model = "melotts-zh-cn"
@@ -1201,7 +1228,7 @@ def melotts_setup(
1201
1228
input .append (enkws )
1202
1229
1203
1230
self .latest_melotts_work_id = self .melotts .setup (
1204
- model , response_format , input , enoutput , request_id
1231
+ model , response_format , input , enoutput , request_id , ** kwargs
1205
1232
)
1206
1233
return self .latest_melotts_work_id
1207
1234
@@ -1219,11 +1246,12 @@ def kws_setup(
1219
1246
enoutput = True ,
1220
1247
enaudio = True ,
1221
1248
request_id = "kws_setup" ,
1249
+ ** kwargs ,
1222
1250
) -> str :
1223
1251
if language == "zh_CN" :
1224
1252
model = "sherpa-onnx-kws-zipformer-wenetspeech-3.3M-2024-01-01"
1225
1253
self .latest_kws_work_id = self .kws .setup (
1226
- kws , model , response_format , input , enoutput , enaudio , request_id
1254
+ kws , model , response_format , input , enoutput , enaudio , request_id , ** kwargs
1227
1255
)
1228
1256
return self .latest_kws_work_id
1229
1257
@@ -1239,6 +1267,7 @@ def asr_setup(
1239
1267
rule2 = 1.2 ,
1240
1268
rule3 = 30.0 ,
1241
1269
request_id = "asr_setup" ,
1270
+ ** kwargs ,
1242
1271
) -> str :
1243
1272
if input is None :
1244
1273
input = "sys.pcm" if self .version == "v1.0" else ["sys.pcm" ]
@@ -1255,7 +1284,16 @@ def asr_setup(
1255
1284
enkws = bool (enkws )
1256
1285
1257
1286
self .latest_asr_work_id = self .asr .setup (
1258
- model , response_format , input , enoutput , enkws , rule1 , rule2 , rule3 , request_id
1287
+ model ,
1288
+ response_format ,
1289
+ input ,
1290
+ enoutput ,
1291
+ enkws ,
1292
+ rule1 ,
1293
+ rule2 ,
1294
+ rule3 ,
1295
+ request_id ,
1296
+ ** kwargs ,
1259
1297
)
1260
1298
return self .latest_asr_work_id
1261
1299
@@ -1267,6 +1305,7 @@ def vad_setup(
1267
1305
enoutput = True ,
1268
1306
enkws = None ,
1269
1307
request_id = "kws_setup" ,
1308
+ ** kwargs ,
1270
1309
) -> str :
1271
1310
if input is None :
1272
1311
input = ["sys.pcm" ]
@@ -1275,7 +1314,7 @@ def vad_setup(
1275
1314
input = [input ]
1276
1315
input .append (enkws )
1277
1316
self .latest_vad_work_id = self .vad .setup (
1278
- model , response_format , input , enoutput , request_id
1317
+ model , response_format , input , enoutput , request_id , ** kwargs
1279
1318
)
1280
1319
return self .latest_vad_work_id
1281
1320
@@ -1289,6 +1328,7 @@ def whisper_setup(
1289
1328
enkws = None ,
1290
1329
envad = None ,
1291
1330
request_id = "asr_setup" ,
1331
+ ** kwargs ,
1292
1332
) -> str :
1293
1333
if input is None :
1294
1334
input = ["sys.pcm" ]
@@ -1301,7 +1341,7 @@ def whisper_setup(
1301
1341
input = [input ]
1302
1342
input .append (envad )
1303
1343
self .latest_whisper_work_id = self .whisper .setup (
1304
- model , response_format , input , enoutput , language , request_id
1344
+ model , response_format , input , enoutput , language , request_id , ** kwargs
1305
1345
)
1306
1346
return self .latest_whisper_work_id
1307
1347
0 commit comments