OVOS plugin for Wav2Vec2
pip install ovos-stt-plugin-wav2vec
"stt": {
"module": "ovos-stt-plugin-wav2vec",
"ovos-stt-plugin-wav2vec": {
"model": "proxectonos/Nos_ASR-wav2vec2-large-xlsr-53-gl-with-lm"
}
}"model" can be any compatible wav2vec2 model from hugging face, if not set, it will be automatically selected based on language
If your language is not supported you can use
"facebook/mms-1b-all", but in that case check out the dedicated plugin ovos-stt-plugin-mms
Supported languages: 'ab', 'ar', 'as', 'ba', 'bas', 'bg', 'bn', 'br', 'ca', 'cnh', 'cv', 'cy',
'cz', 'da', 'de', 'el', 'en', 'eo', 'es', 'fa', 'fi', 'fr', 'ga', 'gl', 'gn', 'ha', 'he',
'hi', 'hk', 'hu', 'hy', 'ia', 'id', 'it', 'jp', 'jv', 'ka', 'ko', 'ku', 'ky', 'lb', 'lg',
'lt', 'ml', 'mn', 'mr', 'mt', 'ne', 'nl', 'or', 'pa', 'pl', 'pt', 'rm-sursilv', 'rm-vallader',
'ro', 'ru', 'sah', 'sk', 'sl', 'su', 'sv', 'sw', 'ta', 'te', 'tr', 'tt', 'uk', 'ur', 'vi', 'zh'
LANG2MODEL = {
"gl": "proxectonos/Nos_ASR-wav2vec2-large-xlsr-53-gl-with-lm",
"pt": "jonatasgrosman/wav2vec2-large-xlsr-53-portuguese",
"en": "jonatasgrosman/wav2vec2-large-xlsr-53-english",
"zh": "jonatasgrosman/wav2vec2-large-xlsr-53-chinese-zh-cn",
"ru": "jonatasgrosman/wav2vec2-large-xlsr-53-russian",
"it": "jonatasgrosman/wav2vec2-large-xlsr-53-italian",
"es": "jonatasgrosman/wav2vec2-large-xlsr-53-spanish",
"fr": "jonatasgrosman/wav2vec2-large-xlsr-53-french",
"de": "jonatasgrosman/wav2vec2-large-xlsr-53-german",
"nl": "jonatasgrosman/wav2vec2-large-xlsr-53-dutch",
"jp": "jonatasgrosman/wav2vec2-large-xlsr-53-japanese",
"pl": "jonatasgrosman/wav2vec2-large-xlsr-53-polish",
"hu": "jonatasgrosman/wav2vec2-large-xlsr-53-hungarian",
"ar": "jonatasgrosman/wav2vec2-large-xlsr-53-arabic",
"fi": "jonatasgrosman/wav2vec2-large-xlsr-53-finnish",
"fa": "jonatasgrosman/wav2vec2-large-xlsr-53-persian",
"el": "jonatasgrosman/wav2vec2-large-xlsr-53-greek",
"ia": "infinitejoy/wav2vec2-large-xls-r-300m-interlingua",
"cnh": "infinitejoy/wav2vec2-large-xls-r-300m-hakha-chin",
"ta": "infinitejoy/wav2vec2-large-xls-r-300m-tamil-cv8",
"or": "infinitejoy/wav2vec2-large-xls-r-300m-odia",
"gn": "infinitejoy/wav2vec2-large-xls-r-300m-guarani",
"cy": "infinitejoy/wav2vec2-large-xls-r-300m-welsh",
"ur": "infinitejoy/wav2vec2-large-xls-r-300m-urdu",
"ab": "infinitejoy/wav2vec2-large-xls-r-300m-abkhaz",
"ba": "infinitejoy/wav2vec2-large-xls-r-300m-bashkir",
"bas": "infinitejoy/wav2vec2-large-xls-r-300m-basaa",
"sah": "infinitejoy/wav2vec2-large-xls-r-300m-sakha",
"mr": "infinitejoy/wav2vec2-large-xls-r-300m-marathi-cv8",
"lt": "infinitejoy/wav2vec2-large-xls-r-300m-lithuanian",
"ha": "infinitejoy/wav2vec2-large-xls-r-300m-hausa",
"br": "infinitejoy/wav2vec2-large-xls-r-300m-breton",
"cv": "infinitejoy/wav2vec2-large-xls-r-300m-chuvash",
"hy": "infinitejoy/wav2vec2-large-xls-r-300m-armenian",
"mt": "infinitejoy/wav2vec2-large-xls-r-300m-maltese",
"as": "infinitejoy/wav2vec2-large-xls-r-300m-assamese",
"tt": "infinitejoy/wav2vec2-large-xls-r-300m-tatar",
"ky": "infinitejoy/wav2vec2-large-xls-r-300m-kyrgyz",
"ga": "infinitejoy/wav2vec2-large-xls-r-300m-irish",
"ka": "infinitejoy/wav2vec2-large-xls-r-300m-georgian",
"sk": "infinitejoy/wav2vec2-large-xls-r-300m-slovak",
"sl": "infinitejoy/wav2vec2-large-xls-r-300m-slovenian",
"mn": "infinitejoy/wav2vec2-large-xls-r-300m-mongolian",
"ro": "infinitejoy/wav2vec2-large-xls-r-300m-romanian",
"ku": "infinitejoy/wav2vec2-large-xls-r-300m-kurdish",
"bg": "infinitejoy/wav2vec2-large-xls-r-300m-bulgarian",
"hi": "infinitejoy/wav2vec2-large-xls-r-300m-hindi",
"rm-vallader": "infinitejoy/wav2vec2-large-xls-r-300m-romansh-vallader",
"rm-sursilv": "infinitejoy/wav2vec2-large-xls-r-300m-romansh-sursilvan",
# "fi": "infinitejoy/wav2vec2-large-xls-r-300m-finnish",
# "hu": "infinitejoy/wav2vec2-large-xls-r-300m-hungarian",
# "el": "infinitejoy/wav2vec2-large-xls-r-300m-greek",
# "gl": "infinitejoy/wav2vec2-large-xls-r-300m-galician",
# "ar": "infinitejoy/wav2vec2-large-xls-r-300m-arabic",
# "id": "infinitejoy/wav2vec2-large-xls-r-300m-indonesian",
"id": "indonesian-nlp/wav2vec2-large-xlsr-indonesian",
"lg": "indonesian-nlp/wav2vec2-luganda",
"jv": "indonesian-nlp/wav2vec2-indonesian-javanese-sundanese",
"su": "indonesian-nlp/wav2vec2-indonesian-javanese-sundanese",
"da": "vachonni/wav2vec2-large-xls-r-300m-dansk-CV-80",
"ml": "Bluecast/wav2vec2-Malayalam",
"hk": "voidful/wav2vec2-large-xlsr-53-hk",
"ko": "kresnik/wav2vec2-large-xlsr-korean",
"vi": "nguyenvulebinh/wav2vec2-base-vietnamese-250h",
"bn": "arijitx/wav2vec2-large-xlsr-bengali",
"eo": "cpierse/wav2vec2-large-xlsr-53-esperanto",
"lb": "Lemswasabi/wav2vec2-large-xlsr-53-842h-luxembourgish-14h-with-lm",
"te": "anuragshas/wav2vec2-large-xlsr-53-telugu",
"tr": "mpoyraz/wav2vec2-xls-r-300m-cv7-turkish",
"ne": "gagan3012/wav2vec2-xlsr-nepali",
"he": "imvladikon/wav2vec2-large-xlsr-53-hebrew",
"sv": "KBLab/wav2vec2-large-xlsr-53-swedish",
"ca": "PereLluis13/wav2vec2-xls-r-1b-ca-lm",
"cz": "arampacha/wav2vec2-large-xlsr-czech",
"sw": "alokmatta/wav2vec2-large-xlsr-53-sw",
"uk": "arampacha/wav2vec2-xls-r-1b-uk",
"pa": "kingabzpro/wav2vec2-large-xlsr-53-punjabi",
}This plugin was funded by the Ministerio para la Transformación Digital y de la Función Pública and Plan de Recuperación, Transformación y Resiliencia - Funded by EU – NextGenerationEU within the framework of the project ILENIA with reference 2022/TL22/00215337
O Proxecto Nós é un proxecto da Xunta de Galicia cuxa execución foi encomendada á Universidade de Santiago de Compostela, a través de dúas entidades punteiras de investigación en intelixencia artificial e tecnoloxías da linguaxe: o ILG (Instituto da Lingua Galega) e o CiTIUS (Centro Singular de Investigación en Tecnoloxías Intelixentes).

