Skip to content

Commit 3733b1b

Browse files
committed
Add missing languages to AUDIO_LANGUAGES constant and remove languages not supported by WhisperX
1 parent 4843c62 commit 3733b1b

File tree

1 file changed

+54
-28
lines changed

1 file changed

+54
-28
lines changed

src/utils/constants.py

Lines changed: 54 additions & 28 deletions
Original file line numberDiff line numberDiff line change
@@ -6,77 +6,103 @@
66
"af": "Afrikaans",
77
"am": "Amharic",
88
"ar": "Arabic",
9-
"hy": "Armenian",
9+
"as": "Assamese",
1010
"az": "Azerbaijan",
11-
"eu": "Basque",
11+
"ba": "Bashkir",
1212
"be": "Belarusian",
13-
"bn": "Bengali",
1413
"bg": "Bulgarian",
14+
"bn": "Bengali",
15+
"bo": "Tibetan",
16+
"br": "Breton",
17+
"bs": "Bosnian",
1518
"ca": "Catalan",
16-
"zh": "Chinese (China)",
17-
"zh_HK": "Chinese (Hong Kong)",
18-
"zh_TW": "Chinese (Taiwan)",
19-
"hr": "Croatian",
2019
"cs": "Czech",
20+
"cy": "Welsh",
2121
"da": "Danish",
22-
"nl": "Dutch",
22+
"de": "German",
23+
"el": "Greek",
2324
"en": "English",
25+
"es": "Spanish",
2426
"et": "Estonian",
27+
"eu": "Basque",
2528
"fa": "Farsi",
26-
"fil": "Filipino",
2729
"fi": "Finnish",
30+
"fo": "Faroese",
2831
"fr": "French",
2932
"gl": "Galician",
30-
"ka": "Georgian",
31-
"de": "German",
32-
"de_CH": "German (Swiss Standard)",
33-
"el": "Greek",
3433
"gu": "Gujarati",
35-
"iw": "Hebrew",
34+
"ha": "Hausa",
35+
"haw": "Hawaiian",
36+
"he": "Hebrew",
3637
"hi": "Hindi",
38+
"hr": "Croatian",
39+
"ht": "Haitian",
3740
"hu": "Hungarian",
38-
"is": "Icelandic",
41+
"hy": "Armenian",
3942
"id": "Indonesian",
43+
"is": "Icelandic",
4044
"it": "Italian",
41-
"it_CH": "Swiss Italian",
4245
"ja": "Japanese",
43-
"jv": "Javanese",
44-
"kn": "Kannada",
46+
"jw": "Javanese",
47+
"ka": "Georgian",
4548
"kk": "Kazakh",
4649
"km": "Khmer",
50+
"kn": "Kannada",
4751
"ko": "Korean",
52+
"la": "Latin",
53+
"lb": "Luxembourgish",
54+
"ln": "Lingala",
4855
"lo": "Lao",
49-
"lv": "Latvian",
5056
"lt": "Lithuanian",
51-
"ms": "Malay",
57+
"lv": "Latvian",
58+
"mg": "Malagasy",
59+
"mi": "Maori",
60+
"mk": "Macedonian",
5261
"ml": "Malayalam",
53-
"mt": "Maltese",
54-
"mr": "Marathi",
5562
"mn": "Mongolian",
63+
"mr": "Marathi",
64+
"ms": "Malay",
65+
"mt": "Maltese",
66+
"my": "Burmese",
5667
"ne": "Nepali",
57-
"no": "Norwegian",
68+
"nl": "Dutch",
5869
"nn": "Norwegian Nynorsk",
70+
"no": "Norwegian",
71+
"oc": "Occitan",
72+
"pa": "Punjabi",
5973
"pl": "Polish",
74+
"ps": "Pashto",
6075
"pt": "Português",
61-
"pa": "Punjabi",
6276
"ro": "Romanian",
6377
"ru": "Russian",
64-
"sr": "Serbian",
78+
"sa": "Sanskrit",
79+
"sd": "Sindhi",
6580
"si": "Sinhala",
6681
"sk": "Slovak",
6782
"sl": "Slovenian",
68-
"es": "Spanish",
83+
"sn": "Shona",
84+
"so": "Somali",
85+
"sq": "Albanian",
86+
"sr": "Serbian",
6987
"su": "Sundanese",
70-
"sw": "Swahili",
7188
"sv": "Swedish",
89+
"sw": "Swahili",
7290
"ta": "Tamil",
7391
"te": "Telugu",
92+
"tg": "Tajik",
7493
"th": "Thai",
94+
"tk": "Turkmen",
95+
"tl": "Tagalog",
7596
"tr": "Turkish",
97+
"tt": "Tatar",
7698
"uk": "Ukrainian",
7799
"ur": "Urdu",
100+
"uz": "Uzbek",
78101
"vi": "Vietnamese",
79-
"zu": "Zulu",
102+
"yi": "Yiddish",
103+
"yo": "Yoruba",
104+
"yue": "Chinese (Yue)",
105+
"zh": "Chinese",
80106
}
81107

82108
AUDIO_FILE_EXTENSIONS = [

0 commit comments

Comments
 (0)