koichi12 committed on Nov 28, 2024

Commit

735d58a

verified ·

1 Parent(s): 9ae4866

Add files using upload-large-folder tool

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/README.md +49 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/_belebele.yaml +133 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_acm_Arab.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_afr_Latn.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_als_Latn.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_apc_Arab.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_arb_Latn.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_ars_Arab.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_arz_Arab.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_asm_Beng.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_bam_Latn.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_ben_Beng.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_bul_Cyrl.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_cat_Latn.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_ceb_Latn.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_ckb_Arab.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_dan_Latn.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_deu_Latn.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_eng_Latn.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_est_Latn.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_fin_Latn.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_fuv_Latn.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_gaz_Latn.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_grn_Latn.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_guj_Gujr.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_hat_Latn.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_heb_Hebr.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_hin_Deva.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_hun_Latn.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_ibo_Latn.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_ilo_Latn.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_ind_Latn.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_ita_Latn.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_jav_Latn.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_kac_Latn.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_kat_Geor.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_kea_Latn.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_khk_Cyrl.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_kin_Latn.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_kir_Cyrl.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_lit_Latn.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_lug_Latn.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_luo_Latn.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_lvs_Latn.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_mal_Mlym.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_mar_Deva.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_mlt_Latn.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_mri_Latn.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_npi_Latn.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_nso_Latn.yaml +4 -0

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/README.md ADDED Viewed

	@@ -0,0 +1,49 @@

+# Belebele
+### Paper
+The Belebele Benchmark: a Parallel Reading Comprehension Dataset in 122 Language Variants
+https://arxiv.org/abs/2308.16884
+Belebele is a multiple-choice machine reading comprehension (MRC) dataset spanning 122 language variants. This dataset enables the evaluation of mono- and multi-lingual models in high-, medium-, and low-resource languages. Each question has four multiple-choice answers and is linked to a short passage from the FLORES-200 dataset. The human annotation procedure was carefully curated to create questions that discriminate between different levels of generalizable language comprehension and is reinforced by extensive quality checks. While all questions directly relate to the passage, the English dataset on its own proves difficult enough to challenge state-of-the-art language models. Being fully parallel, this dataset enables direct comparison of model performance across all languages. Belebele opens up new avenues for evaluating and analyzing the multilingual abilities of language models and NLP systems.
+Homepage: https://github.com/facebookresearch/belebele
+### Citation
+```bibtex
+@misc{bandarkar2023belebele,
+      title={The Belebele Benchmark: a Parallel Reading Comprehension Dataset in 122 Language Variants},
+      author={Lucas Bandarkar and Davis Liang and Benjamin Muller and Mikel Artetxe and Satya Narayan Shukla and Donald Husa and Naman Goyal and Abhinandan Krishnan and Luke Zettlemoyer and Madian Khabsa},
+      year={2023},
+      eprint={2308.16884},
+      archivePrefix={arXiv},
+      primaryClass={cs.CL}
+}
+```
+### Groups and Tasks
+#### Groups
+- `belebele`: All 122 languages of the Belebele dataset, evaluated following the methodology in MMLU's original implementation.
+#### Tasks
+The following tasks evaluate languages in the Belebele dataset using loglikelihood-based multiple-choice scoring:
+- `belebele_{language}`
+The variant evaluated here is the 0-shot or few-shot evaluation with English instructions.
+### Checklist
+* [x] Is the task an existing benchmark in the literature?
+  * [x] Have you referenced the original paper that introduced the task?
+  * [x] If yes, does the original paper provide a reference implementation?
+    * [ ] Yes, original implementation contributed by author of the benchmark
+If other tasks on this dataset are already supported:
+* [x] Is the "Main" variant of this task clearly denoted?
+* [x] Have you provided a short sentence in a README on what each new variant adds / evaluates?
+* [ ] Have you noted which, if any, published evaluation setups are matched by this variant?

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/_belebele.yaml ADDED Viewed

	@@ -0,0 +1,133 @@

+group: belebele
+task:
+  - belebele_acm_Arab
+  - belebele_arz_Arab
+  - belebele_ceb_Latn
+  - belebele_fin_Latn
+  - belebele_hin_Deva
+  - belebele_ita_Latn
+  - belebele_khm_Khmr
+  - belebele_lvs_Latn
+  - belebele_npi_Deva
+  - belebele_pol_Latn
+  - belebele_slv_Latn
+  - belebele_swe_Latn
+  - belebele_tso_Latn
+  - belebele_xho_Latn
+  - belebele_afr_Latn
+  - belebele_asm_Beng
+  - belebele_ces_Latn
+  - belebele_fra_Latn
+  - belebele_hin_Latn
+  - belebele_jav_Latn
+  - belebele_kin_Latn
+  - belebele_mal_Mlym
+  - belebele_npi_Latn
+  - belebele_por_Latn
+  - belebele_sna_Latn
+  - belebele_swh_Latn
+  - belebele_tur_Latn
+  - belebele_yor_Latn
+  - belebele_als_Latn
+  - belebele_azj_Latn
+  - belebele_ckb_Arab
+  - belebele_fuv_Latn
+  - belebele_hrv_Latn
+  - belebele_jpn_Jpan
+  - belebele_kir_Cyrl
+  - belebele_mar_Deva
+  - belebele_nso_Latn
+  - belebele_snd_Arab
+  - belebele_tam_Taml
+  - belebele_ukr_Cyrl
+  - belebele_zho_Hans
+  - belebele_amh_Ethi
+  - belebele_bam_Latn
+  - belebele_dan_Latn
+  - belebele_gaz_Latn
+  - belebele_hun_Latn
+  - belebele_kac_Latn
+  - belebele_kor_Hang
+  - belebele_mkd_Cyrl
+  - belebele_nya_Latn
+  - belebele_ron_Latn
+  - belebele_som_Latn
+  - belebele_tel_Telu
+  - belebele_urd_Arab
+  - belebele_zho_Hant
+  - belebele_apc_Arab
+  - belebele_ben_Beng
+  - belebele_deu_Latn
+  - belebele_grn_Latn
+  - belebele_hye_Armn
+  - belebele_kan_Knda
+  - belebele_lao_Laoo
+  - belebele_mlt_Latn
+  - belebele_ory_Orya
+  - belebele_rus_Cyrl
+  - belebele_sot_Latn
+  - belebele_tgk_Cyrl
+  - belebele_urd_Latn
+  - belebele_zsm_Latn
+  - belebele_arb_Arab
+  - belebele_ben_Latn
+  - belebele_ell_Grek
+  - belebele_guj_Gujr
+  - belebele_ibo_Latn
+  - belebele_kat_Geor
+  - belebele_lin_Latn
+  - belebele_mri_Latn
+  - belebele_pan_Guru
+  - belebele_shn_Mymr
+  - belebele_spa_Latn
+  - belebele_tgl_Latn
+  - belebele_uzn_Latn
+  - belebele_zul_Latn
+  - belebele_arb_Latn
+  - belebele_bod_Tibt
+  - belebele_eng_Latn
+  - belebele_hat_Latn
+  - belebele_ilo_Latn
+  - belebele_kaz_Cyrl
+  - belebele_lit_Latn
+  - belebele_mya_Mymr
+  - belebele_pbt_Arab
+  - belebele_sin_Latn
+  - belebele_srp_Cyrl
+  - belebele_tha_Thai
+  - belebele_vie_Latn
+  - belebele_ars_Arab
+  - belebele_bul_Cyrl
+  - belebele_est_Latn
+  - belebele_hau_Latn
+  - belebele_ind_Latn
+  - belebele_kea_Latn
+  - belebele_lug_Latn
+  - belebele_nld_Latn
+  - belebele_pes_Arab
+  - belebele_sin_Sinh
+  - belebele_ssw_Latn
+  - belebele_tir_Ethi
+  - belebele_war_Latn
+  - belebele_ary_Arab
+  - belebele_cat_Latn
+  - belebele_eus_Latn
+  - belebele_heb_Hebr
+  - belebele_isl_Latn
+  - belebele_khk_Cyrl
+  - belebele_luo_Latn
+  - belebele_nob_Latn
+  - belebele_plt_Latn
+  - belebele_slk_Latn
+  - belebele_sun_Latn
+  - belebele_tsn_Latn
+  - belebele_wol_Latn
+aggregate_metric_list:
+  - aggregation: mean
+    metric: acc
+    weight_by_size: true
+  - aggregation: mean
+    metric: acc_norm
+    weight_by_size: true
+metadata:
+  version: 0.0

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_acm_Arab.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "acm_Arab"
+"include": "_default_template_yaml"
+"task": "belebele_acm_Arab"
+"test_split": "acm_Arab"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_afr_Latn.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "afr_Latn"
+"include": "_default_template_yaml"
+"task": "belebele_afr_Latn"
+"test_split": "afr_Latn"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_als_Latn.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "als_Latn"
+"include": "_default_template_yaml"
+"task": "belebele_als_Latn"
+"test_split": "als_Latn"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_apc_Arab.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "apc_Arab"
+"include": "_default_template_yaml"
+"task": "belebele_apc_Arab"
+"test_split": "apc_Arab"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_arb_Latn.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "arb_Latn"
+"include": "_default_template_yaml"
+"task": "belebele_arb_Latn"
+"test_split": "arb_Latn"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_ars_Arab.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "ars_Arab"
+"include": "_default_template_yaml"
+"task": "belebele_ars_Arab"
+"test_split": "ars_Arab"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_arz_Arab.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "arz_Arab"
+"include": "_default_template_yaml"
+"task": "belebele_arz_Arab"
+"test_split": "arz_Arab"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_asm_Beng.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "asm_Beng"
+"include": "_default_template_yaml"
+"task": "belebele_asm_Beng"
+"test_split": "asm_Beng"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_bam_Latn.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "bam_Latn"
+"include": "_default_template_yaml"
+"task": "belebele_bam_Latn"
+"test_split": "bam_Latn"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_ben_Beng.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "ben_Beng"
+"include": "_default_template_yaml"
+"task": "belebele_ben_Beng"
+"test_split": "ben_Beng"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_bul_Cyrl.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "bul_Cyrl"
+"include": "_default_template_yaml"
+"task": "belebele_bul_Cyrl"
+"test_split": "bul_Cyrl"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_cat_Latn.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "cat_Latn"
+"include": "_default_template_yaml"
+"task": "belebele_cat_Latn"
+"test_split": "cat_Latn"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_ceb_Latn.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "ceb_Latn"
+"include": "_default_template_yaml"
+"task": "belebele_ceb_Latn"
+"test_split": "ceb_Latn"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_ckb_Arab.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "ckb_Arab"
+"include": "_default_template_yaml"
+"task": "belebele_ckb_Arab"
+"test_split": "ckb_Arab"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_dan_Latn.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "dan_Latn"
+"include": "_default_template_yaml"
+"task": "belebele_dan_Latn"
+"test_split": "dan_Latn"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_deu_Latn.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "deu_Latn"
+"include": "_default_template_yaml"
+"task": "belebele_deu_Latn"
+"test_split": "deu_Latn"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_eng_Latn.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "eng_Latn"
+"include": "_default_template_yaml"
+"task": "belebele_eng_Latn"
+"test_split": "eng_Latn"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_est_Latn.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "est_Latn"
+"include": "_default_template_yaml"
+"task": "belebele_est_Latn"
+"test_split": "est_Latn"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_fin_Latn.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "fin_Latn"
+"include": "_default_template_yaml"
+"task": "belebele_fin_Latn"
+"test_split": "fin_Latn"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_fuv_Latn.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "fuv_Latn"
+"include": "_default_template_yaml"
+"task": "belebele_fuv_Latn"
+"test_split": "fuv_Latn"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_gaz_Latn.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "gaz_Latn"
+"include": "_default_template_yaml"
+"task": "belebele_gaz_Latn"
+"test_split": "gaz_Latn"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_grn_Latn.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "grn_Latn"
+"include": "_default_template_yaml"
+"task": "belebele_grn_Latn"
+"test_split": "grn_Latn"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_guj_Gujr.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "guj_Gujr"
+"include": "_default_template_yaml"
+"task": "belebele_guj_Gujr"
+"test_split": "guj_Gujr"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_hat_Latn.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "hat_Latn"
+"include": "_default_template_yaml"
+"task": "belebele_hat_Latn"
+"test_split": "hat_Latn"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_heb_Hebr.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "heb_Hebr"
+"include": "_default_template_yaml"
+"task": "belebele_heb_Hebr"
+"test_split": "heb_Hebr"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_hin_Deva.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "hin_Deva"
+"include": "_default_template_yaml"
+"task": "belebele_hin_Deva"
+"test_split": "hin_Deva"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_hun_Latn.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "hun_Latn"
+"include": "_default_template_yaml"
+"task": "belebele_hun_Latn"
+"test_split": "hun_Latn"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_ibo_Latn.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "ibo_Latn"
+"include": "_default_template_yaml"
+"task": "belebele_ibo_Latn"
+"test_split": "ibo_Latn"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_ilo_Latn.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "ilo_Latn"
+"include": "_default_template_yaml"
+"task": "belebele_ilo_Latn"
+"test_split": "ilo_Latn"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_ind_Latn.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "ind_Latn"
+"include": "_default_template_yaml"
+"task": "belebele_ind_Latn"
+"test_split": "ind_Latn"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_ita_Latn.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "ita_Latn"
+"include": "_default_template_yaml"
+"task": "belebele_ita_Latn"
+"test_split": "ita_Latn"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_jav_Latn.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "jav_Latn"
+"include": "_default_template_yaml"
+"task": "belebele_jav_Latn"
+"test_split": "jav_Latn"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_kac_Latn.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "kac_Latn"
+"include": "_default_template_yaml"
+"task": "belebele_kac_Latn"
+"test_split": "kac_Latn"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_kat_Geor.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "kat_Geor"
+"include": "_default_template_yaml"
+"task": "belebele_kat_Geor"
+"test_split": "kat_Geor"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_kea_Latn.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "kea_Latn"
+"include": "_default_template_yaml"
+"task": "belebele_kea_Latn"
+"test_split": "kea_Latn"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_khk_Cyrl.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "khk_Cyrl"
+"include": "_default_template_yaml"
+"task": "belebele_khk_Cyrl"
+"test_split": "khk_Cyrl"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_kin_Latn.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "kin_Latn"
+"include": "_default_template_yaml"
+"task": "belebele_kin_Latn"
+"test_split": "kin_Latn"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_kir_Cyrl.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "kir_Cyrl"
+"include": "_default_template_yaml"
+"task": "belebele_kir_Cyrl"
+"test_split": "kir_Cyrl"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_lit_Latn.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "lit_Latn"
+"include": "_default_template_yaml"
+"task": "belebele_lit_Latn"
+"test_split": "lit_Latn"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_lug_Latn.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "lug_Latn"
+"include": "_default_template_yaml"
+"task": "belebele_lug_Latn"
+"test_split": "lug_Latn"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_luo_Latn.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "luo_Latn"
+"include": "_default_template_yaml"
+"task": "belebele_luo_Latn"
+"test_split": "luo_Latn"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_lvs_Latn.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "lvs_Latn"
+"include": "_default_template_yaml"
+"task": "belebele_lvs_Latn"
+"test_split": "lvs_Latn"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_mal_Mlym.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "mal_Mlym"
+"include": "_default_template_yaml"
+"task": "belebele_mal_Mlym"
+"test_split": "mal_Mlym"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_mar_Deva.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "mar_Deva"
+"include": "_default_template_yaml"
+"task": "belebele_mar_Deva"
+"test_split": "mar_Deva"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_mlt_Latn.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "mlt_Latn"
+"include": "_default_template_yaml"
+"task": "belebele_mlt_Latn"
+"test_split": "mlt_Latn"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_mri_Latn.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "mri_Latn"
+"include": "_default_template_yaml"
+"task": "belebele_mri_Latn"
+"test_split": "mri_Latn"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_npi_Latn.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "npi_Latn"
+"include": "_default_template_yaml"
+"task": "belebele_npi_Latn"
+"test_split": "npi_Latn"

scripts/yans/lm-evaluation-harness/lm_eval/tasks/belebele/belebele_nso_Latn.yaml ADDED Viewed

	@@ -0,0 +1,4 @@

+"fewshot_split": "nso_Latn"
+"include": "_default_template_yaml"
+"task": "belebele_nso_Latn"
+"test_split": "nso_Latn"