Add files using upload-large-folder tool
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_amh.yaml +6 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_eng.yaml +6 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_ewe.yaml +6 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_fra.yaml +6 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_hau.yaml +6 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_ibo.yaml +6 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_kin.yaml +6 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_lin.yaml +6 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_lug.yaml +6 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_orm.yaml +6 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_sna.yaml +6 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_sot.yaml +6 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_swa.yaml +6 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_twi.yaml +6 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_wol.yaml +6 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_xho.yaml +6 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_yaml +25 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_yor.yaml +6 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_zul.yaml +6 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/utils.py +1 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_fra.yaml +4 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_hau.yaml +4 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_kin.yaml +4 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_lug.yaml +4 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_orm.yaml +4 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_sna.yaml +4 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_sot.yaml +4 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_swa.yaml +4 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_xho.yaml +4 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_yaml +32 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/translate/utils.py +6 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_amh.yaml +4 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_eng.yaml +4 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_ewe.yaml +4 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_fra.yaml +4 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_hau.yaml +4 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_ibo.yaml +4 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_kin.yaml +4 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_lin.yaml +4 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_lug.yaml +4 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_orm.yaml +4 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_sna.yaml +4 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_sot.yaml +4 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_swa.yaml +4 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_twi.yaml +4 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_wol.yaml +4 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_xho.yaml +4 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_yaml +31 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_yor.yaml +4 -0
- scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_zul.yaml +4 -0
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_amh.yaml
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: amh
|
| 3 |
+
doc_to_choice: '{{[premise+", ትክክል? አዎ, "+hypothesis,premise+", ትክክል? እንዲሁም, "+hypothesis,premise+",
|
| 4 |
+
ትክክል? አይ, "+hypothesis]}}'
|
| 5 |
+
include: afrixnli_native_direct_yaml
|
| 6 |
+
task: afrixnli_native_direct_amh
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_eng.yaml
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: eng
|
| 3 |
+
doc_to_choice: '{{[premise+", Right? Yes, "+hypothesis,premise+", Right? Also, "+hypothesis,premise+",
|
| 4 |
+
Right? No, "+hypothesis]}}'
|
| 5 |
+
include: afrixnli_native_direct_yaml
|
| 6 |
+
task: afrixnli_native_direct_eng
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_ewe.yaml
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: ewe
|
| 3 |
+
doc_to_choice: '{{[premise+", Esɔ gbe? Ɛ̃, "+hypothesis,premise+", Esɔ gbe? Hã, "+hypothesis,premise+",
|
| 4 |
+
Esɔ gbe? Ao, "+hypothesis]}}'
|
| 5 |
+
include: afrixnli_native_direct_yaml
|
| 6 |
+
task: afrixnli_native_direct_ewe
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_fra.yaml
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: fra
|
| 3 |
+
doc_to_choice: '{{[premise+", correct? Oui, "+hypothesis,premise+", correct? Aussi,
|
| 4 |
+
"+hypothesis,premise+", correct? Non, "+hypothesis]}}'
|
| 5 |
+
include: afrixnli_native_direct_yaml
|
| 6 |
+
task: afrixnli_native_direct_fra
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_hau.yaml
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: hau
|
| 3 |
+
doc_to_choice: '{{[premise+", Daidai? Ee, "+hypothesis,premise+", Daidai? Haka kuma,
|
| 4 |
+
"+hypothesis,premise+", Daidai? A''a, "+hypothesis]}}'
|
| 5 |
+
include: afrixnli_native_direct_yaml
|
| 6 |
+
task: afrixnli_native_direct_hau
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_ibo.yaml
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: ibo
|
| 3 |
+
doc_to_choice: '{{[premise+", Ziri ezi? Éè, "+hypothesis,premise+", Ziri ezi? Ọzọkwa,
|
| 4 |
+
"+hypothesis,premise+", Ziri ezi? Mba, "+hypothesis]}}'
|
| 5 |
+
include: afrixnli_native_direct_yaml
|
| 6 |
+
task: afrixnli_native_direct_ibo
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_kin.yaml
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: kin
|
| 3 |
+
doc_to_choice: '{{[premise+", Nibyo? Yego, "+hypothesis,premise+", Nibyo? Na none,
|
| 4 |
+
"+hypothesis,premise+", Nibyo? Oya, "+hypothesis]}}'
|
| 5 |
+
include: afrixnli_native_direct_yaml
|
| 6 |
+
task: afrixnli_native_direct_kin
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_lin.yaml
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: lin
|
| 3 |
+
doc_to_choice: '{{[premise+", Malamu? Iyo, "+hypothesis,premise+", Malamu? Lisusu,
|
| 4 |
+
"+hypothesis,premise+", Malamu? Te, "+hypothesis]}}'
|
| 5 |
+
include: afrixnli_native_direct_yaml
|
| 6 |
+
task: afrixnli_native_direct_lin
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_lug.yaml
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: lug
|
| 3 |
+
doc_to_choice: '{{[premise+", Kituufu? Yee, "+hypothesis,premise+", Kituufu? N’ekirala,
|
| 4 |
+
"+hypothesis,premise+", Kituufu? Nedda, "+hypothesis]}}'
|
| 5 |
+
include: afrixnli_native_direct_yaml
|
| 6 |
+
task: afrixnli_native_direct_lug
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_orm.yaml
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: orm
|
| 3 |
+
doc_to_choice: '{{[premise+", Sirrii? Eeyyee, "+hypothesis,premise+", Sirrii? Akkasumas,
|
| 4 |
+
"+hypothesis,premise+", Sirrii? Lakki, "+hypothesis]}}'
|
| 5 |
+
include: afrixnli_native_direct_yaml
|
| 6 |
+
task: afrixnli_native_direct_orm
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_sna.yaml
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: sna
|
| 3 |
+
doc_to_choice: '{{[premise+", Chokwadi? Hongu, "+hypothesis,premise+", Chokwadi? Uye,
|
| 4 |
+
"+hypothesis,premise+", Chokwadi? Kwete, "+hypothesis]}}'
|
| 5 |
+
include: afrixnli_native_direct_yaml
|
| 6 |
+
task: afrixnli_native_direct_sna
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_sot.yaml
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: sot
|
| 3 |
+
doc_to_choice: '{{[premise+", Nepile? E, "+hypothesis,premise+", Nepile? Hape, "+hypothesis,premise+",
|
| 4 |
+
Nepile? Tjhe, "+hypothesis]}}'
|
| 5 |
+
include: afrixnli_native_direct_yaml
|
| 6 |
+
task: afrixnli_native_direct_sot
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_swa.yaml
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: swa
|
| 3 |
+
doc_to_choice: '{{[premise+", Sahihi? Ndiyo, "+hypothesis,premise+", Sahihi? Pia,
|
| 4 |
+
"+hypothesis,premise+", Sahihi? Hapana, "+hypothesis]}}'
|
| 5 |
+
include: afrixnli_native_direct_yaml
|
| 6 |
+
task: afrixnli_native_direct_swa
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_twi.yaml
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: twi
|
| 3 |
+
doc_to_choice: '{{[premise+", Nifa? Aane, "+hypothesis,premise+", Nifa? Anaasɛ, "+hypothesis,premise+",
|
| 4 |
+
Nifa? Daabi, "+hypothesis]}}'
|
| 5 |
+
include: afrixnli_native_direct_yaml
|
| 6 |
+
task: afrixnli_native_direct_twi
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_wol.yaml
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: wol
|
| 3 |
+
doc_to_choice: '{{[premise+", Dëgg? Waaw, "+hypothesis,premise+", Dëgg? Itam, "+hypothesis,premise+",
|
| 4 |
+
Dëgg? Déet, "+hypothesis]}}'
|
| 5 |
+
include: afrixnli_native_direct_yaml
|
| 6 |
+
task: afrixnli_native_direct_wol
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_xho.yaml
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: xho
|
| 3 |
+
doc_to_choice: '{{[premise+", Ichanekile? Ewe, "+hypothesis,premise+", Ichanekile?
|
| 4 |
+
Kananjalo, "+hypothesis,premise+", Ichanekile? Hayi, "+hypothesis]}}'
|
| 5 |
+
include: afrixnli_native_direct_yaml
|
| 6 |
+
task: afrixnli_native_direct_xho
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_yaml
ADDED
|
@@ -0,0 +1,25 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
group:
|
| 2 |
+
- afrixnli
|
| 3 |
+
- afrixnli_native_direct
|
| 4 |
+
dataset_path: masakhane/afrixnli
|
| 5 |
+
dataset_name: null
|
| 6 |
+
output_type: multiple_choice
|
| 7 |
+
validation_split: validation
|
| 8 |
+
test_split: test
|
| 9 |
+
fewshot_split: validation
|
| 10 |
+
doc_to_target: label
|
| 11 |
+
doc_to_text: ""
|
| 12 |
+
metric_list:
|
| 13 |
+
- metric: f1
|
| 14 |
+
aggregation: !function utils.weighted_f1_score
|
| 15 |
+
average: weighted
|
| 16 |
+
higher_is_better: True
|
| 17 |
+
ignore_case: true
|
| 18 |
+
ignore_punctuation: true
|
| 19 |
+
- metric: acc
|
| 20 |
+
aggregation: mean
|
| 21 |
+
higher_is_better: true
|
| 22 |
+
ignore_case: true
|
| 23 |
+
ignore_punctuation: true
|
| 24 |
+
metadata:
|
| 25 |
+
version: 1.0
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_yor.yaml
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: yor
|
| 3 |
+
doc_to_choice: '{{[premise+", Òótọ́? Bẹ́ẹ̀ni, "+hypothesis,premise+", Òótọ́? Àti pé,
|
| 4 |
+
"+hypothesis,premise+", Òótọ́? Rárá, "+hypothesis]}}'
|
| 5 |
+
include: afrixnli_native_direct_yaml
|
| 6 |
+
task: afrixnli_native_direct_yor
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/afrixnli_native_direct_zul.yaml
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: zul
|
| 3 |
+
doc_to_choice: '{{[premise+", Kulungile? Yebo, "+hypothesis,premise+", Kulungile?
|
| 4 |
+
Futhi, "+hypothesis,premise+", Kulungile? Cha, "+hypothesis]}}'
|
| 5 |
+
include: afrixnli_native_direct_yaml
|
| 6 |
+
task: afrixnli_native_direct_zul
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/native-direct/utils.py
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
from lm_eval.utils import weighted_f1_score
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_fra.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: fra
|
| 3 |
+
include: afrixnli_translate_yaml
|
| 4 |
+
task: afrixnli_translate_fra
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_hau.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: hau
|
| 3 |
+
include: afrixnli_translate_yaml
|
| 4 |
+
task: afrixnli_translate_hau
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_kin.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: kin
|
| 3 |
+
include: afrixnli_translate_yaml
|
| 4 |
+
task: afrixnli_translate_kin
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_lug.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: lug
|
| 3 |
+
include: afrixnli_translate_yaml
|
| 4 |
+
task: afrixnli_translate_lug
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_orm.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: orm
|
| 3 |
+
include: afrixnli_translate_yaml
|
| 4 |
+
task: afrixnli_translate_orm
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_sna.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: sna
|
| 3 |
+
include: afrixnli_translate_yaml
|
| 4 |
+
task: afrixnli_translate_sna
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_sot.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: sot
|
| 3 |
+
include: afrixnli_translate_yaml
|
| 4 |
+
task: afrixnli_translate_sot
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_swa.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: swa
|
| 3 |
+
include: afrixnli_translate_yaml
|
| 4 |
+
task: afrixnli_translate_swa
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_xho.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: xho
|
| 3 |
+
include: afrixnli_translate_yaml
|
| 4 |
+
task: afrixnli_translate_xho
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/translate/afrixnli_translate_yaml
ADDED
|
@@ -0,0 +1,32 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
group:
|
| 2 |
+
- afrixnli
|
| 3 |
+
- afrixnli_translate
|
| 4 |
+
dataset_path: masakhane/afrixnli-translate-test
|
| 5 |
+
dataset_name: null
|
| 6 |
+
output_type: multiple_choice
|
| 7 |
+
test_split: test
|
| 8 |
+
doc_to_text: "{{premise}}\nQuestion: {{hypothesis}} True, False, or Neither?\nAnswer:"
|
| 9 |
+
# True = entailment
|
| 10 |
+
# False = contradiction
|
| 11 |
+
# Neither = neutral
|
| 12 |
+
doc_to_target: !function utils.doc_to_target
|
| 13 |
+
doc_to_choice:
|
| 14 |
+
- "True"
|
| 15 |
+
- "Neither"
|
| 16 |
+
- "False"
|
| 17 |
+
should_decontaminate: true
|
| 18 |
+
doc_to_decontamination_query: premise
|
| 19 |
+
metric_list:
|
| 20 |
+
- metric: f1
|
| 21 |
+
aggregation: !function utils.weighted_f1_score
|
| 22 |
+
average: weighted
|
| 23 |
+
higher_is_better: True
|
| 24 |
+
ignore_case: true
|
| 25 |
+
ignore_punctuation: true
|
| 26 |
+
- metric: acc
|
| 27 |
+
aggregation: mean
|
| 28 |
+
higher_is_better: true
|
| 29 |
+
ignore_case: true
|
| 30 |
+
ignore_punctuation: true
|
| 31 |
+
metadata:
|
| 32 |
+
version: 1.0
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/anli prompt/translate/utils.py
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
from lm_eval.utils import weighted_f1_score
|
| 2 |
+
|
| 3 |
+
|
| 4 |
+
def doc_to_target(doc):
|
| 5 |
+
replacements = {0: "True", 1: "Neither", 2: "False"}
|
| 6 |
+
return replacements[doc["label"]]
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_amh.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: amh
|
| 3 |
+
include: afrixnli_manual_direct_yaml
|
| 4 |
+
task: afrixnli_manual_direct_amh
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_eng.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: eng
|
| 3 |
+
include: afrixnli_manual_direct_yaml
|
| 4 |
+
task: afrixnli_manual_direct_eng
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_ewe.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: ewe
|
| 3 |
+
include: afrixnli_manual_direct_yaml
|
| 4 |
+
task: afrixnli_manual_direct_ewe
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_fra.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: fra
|
| 3 |
+
include: afrixnli_manual_direct_yaml
|
| 4 |
+
task: afrixnli_manual_direct_fra
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_hau.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: hau
|
| 3 |
+
include: afrixnli_manual_direct_yaml
|
| 4 |
+
task: afrixnli_manual_direct_hau
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_ibo.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: ibo
|
| 3 |
+
include: afrixnli_manual_direct_yaml
|
| 4 |
+
task: afrixnli_manual_direct_ibo
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_kin.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: kin
|
| 3 |
+
include: afrixnli_manual_direct_yaml
|
| 4 |
+
task: afrixnli_manual_direct_kin
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_lin.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: lin
|
| 3 |
+
include: afrixnli_manual_direct_yaml
|
| 4 |
+
task: afrixnli_manual_direct_lin
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_lug.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: lug
|
| 3 |
+
include: afrixnli_manual_direct_yaml
|
| 4 |
+
task: afrixnli_manual_direct_lug
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_orm.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: orm
|
| 3 |
+
include: afrixnli_manual_direct_yaml
|
| 4 |
+
task: afrixnli_manual_direct_orm
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_sna.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: sna
|
| 3 |
+
include: afrixnli_manual_direct_yaml
|
| 4 |
+
task: afrixnli_manual_direct_sna
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_sot.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: sot
|
| 3 |
+
include: afrixnli_manual_direct_yaml
|
| 4 |
+
task: afrixnli_manual_direct_sot
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_swa.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: swa
|
| 3 |
+
include: afrixnli_manual_direct_yaml
|
| 4 |
+
task: afrixnli_manual_direct_swa
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_twi.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: twi
|
| 3 |
+
include: afrixnli_manual_direct_yaml
|
| 4 |
+
task: afrixnli_manual_direct_twi
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_wol.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: wol
|
| 3 |
+
include: afrixnli_manual_direct_yaml
|
| 4 |
+
task: afrixnli_manual_direct_wol
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_xho.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: xho
|
| 3 |
+
include: afrixnli_manual_direct_yaml
|
| 4 |
+
task: afrixnli_manual_direct_xho
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_yaml
ADDED
|
@@ -0,0 +1,31 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
group:
|
| 2 |
+
- afrixnli
|
| 3 |
+
- afrixnli_manual_direct
|
| 4 |
+
dataset_path: masakhane/afrixnli
|
| 5 |
+
dataset_name: null
|
| 6 |
+
output_type: multiple_choice
|
| 7 |
+
validation_split: validation
|
| 8 |
+
test_split: test
|
| 9 |
+
fewshot_split: validation
|
| 10 |
+
doc_to_text: !function utils.doc_to_text
|
| 11 |
+
doc_to_target: !function utils.doc_to_target
|
| 12 |
+
doc_to_choice:
|
| 13 |
+
- "entailment"
|
| 14 |
+
- "neutral"
|
| 15 |
+
- "contradiction"
|
| 16 |
+
should_decontaminate: true
|
| 17 |
+
doc_to_decontamination_query: premise
|
| 18 |
+
metric_list:
|
| 19 |
+
- metric: f1
|
| 20 |
+
aggregation: !function utils.weighted_f1_score
|
| 21 |
+
average: weighted
|
| 22 |
+
higher_is_better: True
|
| 23 |
+
ignore_case: true
|
| 24 |
+
ignore_punctuation: true
|
| 25 |
+
- metric: acc
|
| 26 |
+
aggregation: mean
|
| 27 |
+
higher_is_better: true
|
| 28 |
+
ignore_case: true
|
| 29 |
+
ignore_punctuation: true
|
| 30 |
+
metadata:
|
| 31 |
+
version: 1.0
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_yor.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: yor
|
| 3 |
+
include: afrixnli_manual_direct_yaml
|
| 4 |
+
task: afrixnli_manual_direct_yor
|
scripts/yans/lm-evaluation-harness/lm_eval/tasks/afrixnli/lai prompt/direct/afrixnli_manual_direct_zul.yaml
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Generated by utils.py
|
| 2 |
+
dataset_name: zul
|
| 3 |
+
include: afrixnli_manual_direct_yaml
|
| 4 |
+
task: afrixnli_manual_direct_zul
|