@@ -125,14 +125,11 @@ class FasterWhisperSTT(STT):
125125
126126 def __init__ (self , * args , ** kwargs ):
127127 super ().__init__ (* args , ** kwargs )
128- model = self .config .get ("model" ) or "whisper-large-v3-turbo"
129- if model == "whisper-large-v3-turbo" :
130- model = "deepdml/faster-whisper-large-v3-turbo-ct2"
131- else :
132- valid_model = model in FasterWhisperSTT .MODELS
133- if not valid_model :
134- LOG .info (f"{ model } is not default model_id ({ FasterWhisperSTT .MODELS } ), "
135- f"assuming huggingface repo_id or path to local model" )
128+ model = self .config .get ("model" ) or "large-v3-turbo"
129+ valid_model = model in FasterWhisperSTT .MODELS
130+ if not valid_model :
131+ LOG .info (f"{ model } is not default model_id ({ FasterWhisperSTT .MODELS } ), "
132+ f"assuming huggingface repo_id or path to local model" )
136133
137134 self .beam_size = self .config .get ("beam_size" , 5 )
138135 self .compute_type = self .config .get ("compute_type" , "int8" )
@@ -210,40 +207,20 @@ def execute(self, audio, language=None):
210207
211208 @classproperty
212209 def available_languages (cls ) -> set :
213- return set (FasterWhisperSTT .LANGUAGES .keys ())
210+ return set (cls .LANGUAGES .keys ())
214211
215212
216213FasterWhisperSTTConfig = {
217- lang : [
218- {
219- "model" : "tiny" ,
220- "lang" : lang ,
221- "meta" : {
222- "priority" : 50 ,
223- "display_name" : "FasterWhisper (Tiny)" ,
224- "offline" : True ,
225- },
226- },
227- {
228- "model" : "base" ,
229- "lang" : lang ,
230- "meta" : {
231- "priority" : 55 ,
232- "display_name" : f"FasterWhisper (Base)" ,
233- "offline" : True ,
234- },
235- },
236- {
237- "model" : "small" ,
238- "lang" : lang ,
239- "meta" : {
240- "priority" : 60 ,
241- "display_name" : f"FasterWhisper (Small)" ,
242- "offline" : True ,
243- },
214+ lang : [{
215+ "model" : model ,
216+ "lang" : lang ,
217+ "meta" : {
218+ "priority" : 50 ,
219+ "display_name" : f"FasterWhisper ({ model } )" ,
220+ "offline" : True ,
244221 },
245- ]
246- for lang , lang_name in FasterWhisperSTT .LANGUAGES . items ()
222+ } for model in FasterWhisperSTT . MODELS ]
223+ for lang in FasterWhisperSTT .available_languages
247224}
248225
249226if __name__ == "__main__" :
@@ -259,7 +236,7 @@ def available_languages(cls) -> set:
259236
260237 from speech_recognition import Recognizer , AudioFile
261238
262- jfk = "/home/miro/PycharmProjects/OVOS/STT/ovos-stt-plugin-fasterwhisper/ jfk.wav"
239+ jfk = "jfk.wav"
263240 with AudioFile (jfk ) as source :
264241 audio = Recognizer ().record (source )
265242
0 commit comments