Spaces:
Build error
Build error
Update app.py
Browse files
app.py
CHANGED
|
@@ -6,6 +6,84 @@ from transformers import pipeline
|
|
| 6 |
|
| 7 |
# Module-level translation pipeline built from the distilled 600M NLLB-200
# checkpoint, requesting bfloat16 as the torch dtype.
pipe = pipeline(
    "translation",
    model="facebook/nllb-200-distilled-600M",
    torch_dtype=torch.bfloat16,
)
|
| 8 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 9 |
def get_fores_code(language):
|
| 10 |
# Loop through the list of languages
|
| 11 |
for entry in languages['languages']:
|
|
|
|
| 6 |
|
| 7 |
# Module-level translation pipeline built from the distilled 600M NLLB-200
# checkpoint, requesting bfloat16 as the torch dtype.
pipe = pipeline(
    "translation",
    model="facebook/nllb-200-distilled-600M",
    torch_dtype=torch.bfloat16,
)
|
| 8 |
|
| 9 |
+
# Lookup table of language display names paired with their language codes
# (e.g. "English" -> "eng_Latn"). The codes are presumably the FLORES-200
# identifiers expected by the NLLB model -- confirm against the model card.
# NOTE(review): the list stops at Igbo; confirm whether the remaining
# NLLB-200 languages were left out intentionally.
languages = {
    "languages": [
        {"name": "Acehnese (Arabic script)", "code": "ace_Arab"},
        {"name": "Acehnese (Latin script)", "code": "ace_Latn"},
        {"name": "Mesopotamian Arabic", "code": "acm_Arab"},
        # The apostrophe is U+2019; it was previously stored as mojibake.
        {"name": "Ta’izzi-Adeni Arabic", "code": "acq_Arab"},
        {"name": "Tunisian Arabic", "code": "aeb_Arab"},
        {"name": "Afrikaans", "code": "afr_Latn"},
        {"name": "South Levantine Arabic", "code": "ajp_Arab"},
        {"name": "Akan", "code": "aka_Latn"},
        {"name": "Amharic", "code": "amh_Ethi"},
        {"name": "North Levantine Arabic", "code": "apc_Arab"},
        {"name": "Modern Standard Arabic", "code": "arb_Arab"},
        {"name": "Modern Standard Arabic (Romanized)", "code": "arb_Latn"},
        {"name": "Najdi Arabic", "code": "ars_Arab"},
        {"name": "Moroccan Arabic", "code": "ary_Arab"},
        {"name": "Egyptian Arabic", "code": "arz_Arab"},
        {"name": "Assamese", "code": "asm_Beng"},
        {"name": "Asturian", "code": "ast_Latn"},
        {"name": "Awadhi", "code": "awa_Deva"},
        {"name": "Central Aymara", "code": "ayr_Latn"},
        {"name": "South Azerbaijani", "code": "azb_Arab"},
        {"name": "North Azerbaijani", "code": "azj_Latn"},
        {"name": "Bashkir", "code": "bak_Cyrl"},
        {"name": "Bambara", "code": "bam_Latn"},
        {"name": "Balinese", "code": "ban_Latn"},
        {"name": "Belarusian", "code": "bel_Cyrl"},
        {"name": "Bemba", "code": "bem_Latn"},
        {"name": "Bengali", "code": "ben_Beng"},
        {"name": "Bhojpuri", "code": "bho_Deva"},
        {"name": "Banjar (Arabic script)", "code": "bjn_Arab"},
        {"name": "Banjar (Latin script)", "code": "bjn_Latn"},
        {"name": "Standard Tibetan", "code": "bod_Tibt"},
        {"name": "Bosnian", "code": "bos_Latn"},
        {"name": "Buginese", "code": "bug_Latn"},
        {"name": "Bulgarian", "code": "bul_Cyrl"},
        {"name": "Catalan", "code": "cat_Latn"},
        {"name": "Cebuano", "code": "ceb_Latn"},
        {"name": "Czech", "code": "ces_Latn"},
        {"name": "Chokwe", "code": "cjk_Latn"},
        {"name": "Central Kurdish", "code": "ckb_Arab"},
        {"name": "Crimean Tatar", "code": "crh_Latn"},
        {"name": "Welsh", "code": "cym_Latn"},
        {"name": "Danish", "code": "dan_Latn"},
        {"name": "German", "code": "deu_Latn"},
        {"name": "Southwestern Dinka", "code": "dik_Latn"},
        {"name": "Dyula", "code": "dyu_Latn"},
        {"name": "Dzongkha", "code": "dzo_Tibt"},
        {"name": "Greek", "code": "ell_Grek"},
        {"name": "English", "code": "eng_Latn"},
        {"name": "Esperanto", "code": "epo_Latn"},
        {"name": "Estonian", "code": "est_Latn"},
        {"name": "Basque", "code": "eus_Latn"},
        {"name": "Ewe", "code": "ewe_Latn"},
        {"name": "Faroese", "code": "fao_Latn"},
        {"name": "Fijian", "code": "fij_Latn"},
        {"name": "Finnish", "code": "fin_Latn"},
        {"name": "Fon", "code": "fon_Latn"},
        {"name": "French", "code": "fra_Latn"},
        {"name": "Friulian", "code": "fur_Latn"},
        {"name": "Nigerian Fulfulde", "code": "fuv_Latn"},
        {"name": "Scottish Gaelic", "code": "gla_Latn"},
        {"name": "Irish", "code": "gle_Latn"},
        {"name": "Galician", "code": "glg_Latn"},
        {"name": "Guarani", "code": "grn_Latn"},
        {"name": "Gujarati", "code": "guj_Gujr"},
        {"name": "Haitian Creole", "code": "hat_Latn"},
        {"name": "Hausa", "code": "hau_Latn"},
        {"name": "Hebrew", "code": "heb_Hebr"},
        {"name": "Hindi", "code": "hin_Deva"},
        {"name": "Chhattisgarhi", "code": "hne_Deva"},
        {"name": "Croatian", "code": "hrv_Latn"},
        {"name": "Hungarian", "code": "hun_Latn"},
        {"name": "Armenian", "code": "hye_Armn"},
        {"name": "Igbo", "code": "ibo_Latn"},
    ]
}
|
| 86 |
+
|
| 87 |
def get_fores_code(language):
|
| 88 |
# Loop through the list of languages
|
| 89 |
for entry in languages['languages']:
|