TiberiuCristianLeon committed on
Commit
0d00ebd
·
verified ·
1 Parent(s): 8b76c73

Update languagecodes.py

Browse files
Files changed (1) hide show
  1. languagecodes.py +110 -0
languagecodes.py CHANGED
@@ -258,4 +258,114 @@ mbart_large_languages = {
258
  'Galician': 'gl_ES',
259
  'Slovene': 'sl_SI'
260
  }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
261
 
 
258
  'Galician': 'gl_ES',
259
  'Slovene': 'sl_SI'
260
  }
261
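+ # Language name -> language code. Most codes are ISO 639-1 two-letter codes; exceptions are the three-letter codes "ceb" and "haw" (these languages have no ISO 639-1 code) and the region-tagged "zh-CN" / "zh-TW" for Chinese.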
262
+ iso_languages = {
263
+ "Afrikaans": "af",
264
+ "Albanian": "sq",
265
+ "Amharic": "am",
266
+ "Arabic": "ar",
267
+ "Armenian": "hy",
268
+ "Azerbaijani": "az",
269
+ "Basque": "eu",
270
+ "Belarusian": "be",
271
+ "Bengali": "bn",
272
+ "Bosnian": "bs",
273
+ "Bulgarian": "bg",
274
+ "Catalan": "ca",
275
+ "Cebuano": "ceb",
276
+ "Chinese (Simplified)": "zh-CN",
277
+ "Chinese (Traditional)": "zh-TW",
278
+ "Corsican": "co",
279
+ "Croatian": "hr",
280
+ "Czech": "cs",
281
+ "Danish": "da",
282
+ "Dutch": "nl",
283
+ "English": "en",
284
+ "Esperanto": "eo",
285
+ "Estonian": "et",
286
+ "Finnish": "fi",
287
+ "French": "fr",
288
+ "Galician": "gl",
289
+ "Georgian": "ka",
290
+ "German": "de",
291
+ "Greek": "el",
292
+ "Gujarati": "gu",
293
+ "Haitian Creole": "ht",
294
+ "Hausa": "ha",
295
+ "Hawaiian": "haw",
296
+ "Hebrew": "he",
297
+ "Hindi": "hi",
298
+ "Hungarian": "hu",
299
+ "Icelandic": "is",
300
+ "Igbo": "ig",
301
+ "Indonesian": "id",
302
+ "Irish": "ga",
303
+ "Italian": "it",
304
+ "Japanese": "ja",
305
+ "Javanese": "jv",
306
+ "Kannada": "kn",
307
+ "Kazakh": "kk",
308
+ "Khmer": "km",
309
+ "Kinyarwanda": "rw",
310
+ "Korean": "ko",
311
+ "Kurdish (Kurmanji)": "ku",
312
+ "Kyrgyz": "ky",
313
+ "Lao": "lo",
314
+ "Latin": "la",
315
+ "Latvian": "lv",
316
+ "Lithuanian": "lt",
317
+ "Luxembourgish": "lb",
318
+ "Macedonian": "mk",
319
+ "Malagasy": "mg",
320
+ "Malay": "ms",
321
+ "Malayalam": "ml",
322
+ "Maltese": "mt",
323
+ "Maori": "mi",
324
+ "Marathi": "mr",
325
+ "Mongolian": "mn",
326
+ "Myanmar (Burmese)": "my",
327
+ "Nepali": "ne",
328
+ "Norwegian": "no",
329
+ "Nyanja (Chichewa)": "ny",
330
+ "Odia (Oriya)": "or",
331
+ "Pashto": "ps",
332
+ "Persian": "fa",
333
+ "Polish": "pl",
334
+ "Portuguese": "pt",
335
+ "Punjabi": "pa",
336
+ "Romanian": "ro",
337
+ "Russian": "ru",
338
+ "Samoan": "sm",
339
+ "Scots Gaelic": "gd",
340
+ "Serbian": "sr",
341
+ "Sesotho": "st",
342
+ "Shona": "sn",
343
+ "Sindhi": "sd",
344
+ "Sinhala": "si",
345
+ "Slovak": "sk",
346
+ "Slovenian": "sl",
347
+ "Somali": "so",
348
+ "Spanish": "es",
349
+ "Sundanese": "su",
350
+ "Swahili": "sw",
351
+ "Swedish": "sv",
352
+ "Tagalog (Filipino)": "tl",
353
+ "Tajik": "tg",
354
+ "Tamil": "ta",
355
+ "Tatar": "tt",
356
+ "Telugu": "te",
357
+ "Thai": "th",
358
+ "Turkish": "tr",
359
+ "Turkmen": "tk",
360
+ "Ukrainian": "uk",
361
+ "Urdu": "ur",
362
+ "Uyghur": "ug",
363
+ "Uzbek": "uz",
364
+ "Vietnamese": "vi",
365
+ "Welsh": "cy",
366
+ "Xhosa": "xh",
367
+ "Yiddish": "yi",
368
+ "Yoruba": "yo",
369
+ "Zulu": "zu"
370
+ }
371