vtiw commited on
Commit
d4e9c7a
·
verified ·
1 Parent(s): cc5d0c7

Delete lang_list.py

Browse files
Files changed (1) hide show
  1. lang_list.py +0 -163
lang_list.py DELETED
@@ -1,163 +0,0 @@
1
- # Language dict
2
- language_code_to_name = {
3
- "afr": "Afrikaans",
4
- "amh": "Amharic",
5
- "arb": "Modern Standard Arabic",
6
- "ary": "Moroccan Arabic",
7
- "arz": "Egyptian Arabic",
8
- "asm": "Assamese",
9
- "ast": "Asturian",
10
- "azj": "North Azerbaijani",
11
- "bel": "Belarusian",
12
- "ben": "Bengali",
13
- "bos": "Bosnian",
14
- "bul": "Bulgarian",
15
- "cat": "Catalan",
16
- "ceb": "Cebuano",
17
- "ces": "Czech",
18
- "ckb": "Central Kurdish",
19
- "cmn": "Mandarin Chinese",
20
- "cym": "Welsh",
21
- "dan": "Danish",
22
- "deu": "German",
23
- "ell": "Greek",
24
- "eng": "English",
25
- "est": "Estonian",
26
- "eus": "Basque",
27
- "fin": "Finnish",
28
- "fra": "French",
29
- "gaz": "West Central Oromo",
30
- "gle": "Irish",
31
- "glg": "Galician",
32
- "guj": "Gujarati",
33
- "heb": "Hebrew",
34
- "hin": "Hindi",
35
- "hrv": "Croatian",
36
- "hun": "Hungarian",
37
- "hye": "Armenian",
38
- "ibo": "Igbo",
39
- "ind": "Indonesian",
40
- "isl": "Icelandic",
41
- "ita": "Italian",
42
- "jav": "Javanese",
43
- "jpn": "Japanese",
44
- "kam": "Kamba",
45
- "kan": "Kannada",
46
- "kat": "Georgian",
47
- "kaz": "Kazakh",
48
- "kea": "Kabuverdianu",
49
- "khk": "Halh Mongolian",
50
- "khm": "Khmer",
51
- "kir": "Kyrgyz",
52
- "kor": "Korean",
53
- "lao": "Lao",
54
- "lit": "Lithuanian",
55
- "ltz": "Luxembourgish",
56
- "lug": "Ganda",
57
- "luo": "Luo",
58
- "lvs": "Standard Latvian",
59
- "mai": "Maithili",
60
- "mal": "Malayalam",
61
- "mar": "Marathi",
62
- "mkd": "Macedonian",
63
- "mlt": "Maltese",
64
- "mni": "Meitei",
65
- "mya": "Burmese",
66
- "nld": "Dutch",
67
- "nno": "Norwegian Nynorsk",
68
- "nob": "Norwegian Bokm\u00e5l",
69
- "npi": "Nepali",
70
- "nya": "Nyanja",
71
- "oci": "Occitan",
72
- "ory": "Odia",
73
- "pan": "Punjabi",
74
- "pbt": "Southern Pashto",
75
- "pes": "Western Persian",
76
- "pol": "Polish",
77
- "por": "Portuguese",
78
- "ron": "Romanian",
79
- "rus": "Russian",
80
- "slk": "Slovak",
81
- "slv": "Slovenian",
82
- "sna": "Shona",
83
- "snd": "Sindhi",
84
- "som": "Somali",
85
- "spa": "Spanish",
86
- "srp": "Serbian",
87
- "swe": "Swedish",
88
- "swh": "Swahili",
89
- "tam": "Tamil",
90
- "tel": "Telugu",
91
- "tgk": "Tajik",
92
- "tgl": "Tagalog",
93
- "tha": "Thai",
94
- "tur": "Turkish",
95
- "ukr": "Ukrainian",
96
- "urd": "Urdu",
97
- "uzn": "Northern Uzbek",
98
- "vie": "Vietnamese",
99
- "xho": "Xhosa",
100
- "yor": "Yoruba",
101
- "yue": "Cantonese",
102
- "zlm": "Colloquial Malay",
103
- "zsm": "Standard Malay",
104
- "zul": "Zulu",
105
- }
106
- LANGUAGE_NAME_TO_CODE = {v: k for k, v in language_code_to_name.items()}
107
-
108
- # Source langs: S2ST / S2TT / ASR don't need source lang
109
- # T2TT / T2ST use this
110
- text_source_language_codes = [
111
- "hin",
112
- "pan",
113
- "eng",
114
- ]
115
- TEXT_SOURCE_LANGUAGE_NAMES = sorted([language_code_to_name[code] for code in text_source_language_codes])
116
-
117
- # Target langs:
118
- # S2ST / T2ST
119
- s2st_target_language_codes = [
120
- "eng",
121
- "arb",
122
- "ben",
123
- "cat",
124
- "ces",
125
- "cmn",
126
- "cym",
127
- "dan",
128
- "deu",
129
- "est",
130
- "fin",
131
- "fra",
132
- "hin",
133
- "ind",
134
- "ita",
135
- "jpn",
136
- "kor",
137
- "mlt",
138
- "nld",
139
- "pes",
140
- "pol",
141
- "por",
142
- "ron",
143
- "rus",
144
- "slk",
145
- "spa",
146
- "swe",
147
- "swh",
148
- "tel",
149
- "tgl",
150
- "tha",
151
- "tur",
152
- "ukr",
153
- "urd",
154
- "uzn",
155
- "vie",
156
- ]
157
- S2ST_TARGET_LANGUAGE_NAMES = sorted([language_code_to_name[code] for code in s2st_target_language_codes])
158
- T2ST_TARGET_LANGUAGE_NAMES = S2ST_TARGET_LANGUAGE_NAMES
159
-
160
- # S2TT / T2TT / ASR
161
- S2TT_TARGET_LANGUAGE_NAMES = TEXT_SOURCE_LANGUAGE_NAMES
162
- T2TT_TARGET_LANGUAGE_NAMES = TEXT_SOURCE_LANGUAGE_NAMES
163
- ASR_TARGET_LANGUAGE_NAMES = TEXT_SOURCE_LANGUAGE_NAMES