Spaces:
Running
Running
Ilker Kesen
commited on
Commit
·
7987659
1
Parent(s):
489c22a
update results
Browse files- app.py +1 -0
- data/datasets.json +1 -1
- results/zero-shot/aya-23-8b.json +7 -0
- results/zero-shot/kanarya-2b.json +3 -3
- results/zero-shot/llama-3.1-8b-instruct.json +19 -12
- results/zero-shot/llama-3.1-8b.json +39 -0
app.py
CHANGED
|
@@ -44,6 +44,7 @@ def cache_datasets(path):
|
|
| 44 |
datasets = json.load(f)
|
| 45 |
for key in datasets.keys():
|
| 46 |
datasets[key]['dataset'] = key
|
|
|
|
| 47 |
return datasets
|
| 48 |
|
| 49 |
|
|
|
|
| 44 |
datasets = json.load(f)
|
| 45 |
for key in datasets.keys():
|
| 46 |
datasets[key]['dataset'] = key
|
| 47 |
+
del datasets['tr-wikihow-summ'] # FIXME: There are missing experiments.
|
| 48 |
return datasets
|
| 49 |
|
| 50 |
|
data/datasets.json
CHANGED
|
@@ -48,7 +48,7 @@
|
|
| 48 |
"generative": true
|
| 49 |
},
|
| 50 |
"tr-wikihow-summ": {
|
| 51 |
-
"name": "
|
| 52 |
"task": "summarization",
|
| 53 |
"description": "A summarization dataset obtained from WikiHow website.",
|
| 54 |
"url": "https://huggingface.co/datasets/ardauzunoglu/tr-wikihow-summ",
|
|
|
|
| 48 |
"generative": true
|
| 49 |
},
|
| 50 |
"tr-wikihow-summ": {
|
| 51 |
+
"name": "WikiHow",
|
| 52 |
"task": "summarization",
|
| 53 |
"description": "A summarization dataset obtained from WikiHow website.",
|
| 54 |
"url": "https://huggingface.co/datasets/ardauzunoglu/tr-wikihow-summ",
|
results/zero-shot/aya-23-8b.json
CHANGED
|
@@ -150,6 +150,13 @@
|
|
| 150 |
"wer": 0.7464128097803795,
|
| 151 |
"bleu": 0.16878189334002527
|
| 152 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 153 |
{
|
| 154 |
"name": "xlsum_tr",
|
| 155 |
"task": "summarization",
|
|
|
|
| 150 |
"wer": 0.7464128097803795,
|
| 151 |
"bleu": 0.16878189334002527
|
| 152 |
},
|
| 153 |
+
{
|
| 154 |
+
"name": "tr-wikihow-summ",
|
| 155 |
+
"task": "summarization",
|
| 156 |
+
"rouge1": 0.04023948542641836,
|
| 157 |
+
"rouge2": 0.0169810919324388,
|
| 158 |
+
"rougeL": 0.03296869279651223
|
| 159 |
+
},
|
| 160 |
{
|
| 161 |
"name": "xlsum_tr",
|
| 162 |
"task": "summarization",
|
results/zero-shot/kanarya-2b.json
CHANGED
|
@@ -157,9 +157,9 @@
|
|
| 157 |
{
|
| 158 |
"name": "tr-wikihow-summ",
|
| 159 |
"task": "summarization",
|
| 160 |
-
"rouge1":
|
| 161 |
-
"rouge2":
|
| 162 |
-
"rougeL":
|
| 163 |
},
|
| 164 |
{
|
| 165 |
"name": "xquad_tr",
|
|
|
|
| 157 |
{
|
| 158 |
"name": "tr-wikihow-summ",
|
| 159 |
"task": "summarization",
|
| 160 |
+
"rouge1": 0.18320144404095734,
|
| 161 |
+
"rouge2": 0.05292686441577856,
|
| 162 |
+
"rougeL": 0.13617779525430102
|
| 163 |
},
|
| 164 |
{
|
| 165 |
"name": "xquad_tr",
|
results/zero-shot/llama-3.1-8b-instruct.json
CHANGED
|
@@ -126,34 +126,41 @@
|
|
| 126 |
{
|
| 127 |
"name": "gecturk_generation",
|
| 128 |
"task": "grammatical_error_correction",
|
| 129 |
-
"exact_match": 0.
|
| 130 |
},
|
| 131 |
{
|
| 132 |
"name": "mlsum_tr",
|
| 133 |
"task": "summarization",
|
| 134 |
-
"rouge1": 0.
|
| 135 |
-
"rouge2": 0.
|
| 136 |
-
"rougeL": 0.
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 137 |
},
|
| 138 |
{
|
| 139 |
"name": "wiki_lingua_tr",
|
| 140 |
"task": "summarization",
|
| 141 |
-
"rouge1": 0.
|
| 142 |
-
"rouge2": 0.
|
| 143 |
-
"rougeL": 0.
|
| 144 |
},
|
| 145 |
{
|
| 146 |
"name": "wmt-tr-en-prompt",
|
| 147 |
"task": "machine_translation",
|
| 148 |
-
"wer": 0.
|
| 149 |
-
"bleu": 0.
|
| 150 |
},
|
| 151 |
{
|
| 152 |
"name": "xlsum_tr",
|
| 153 |
"task": "summarization",
|
| 154 |
-
"rouge1": 0.
|
| 155 |
-
"rouge2": 0.
|
| 156 |
-
"rougeL": 0.
|
| 157 |
}
|
| 158 |
]
|
| 159 |
}
|
|
|
|
| 126 |
{
|
| 127 |
"name": "gecturk_generation",
|
| 128 |
"task": "grammatical_error_correction",
|
| 129 |
+
"exact_match": 0.006548220906158217
|
| 130 |
},
|
| 131 |
{
|
| 132 |
"name": "mlsum_tr",
|
| 133 |
"task": "summarization",
|
| 134 |
+
"rouge1": 0.3970732593089523,
|
| 135 |
+
"rouge2": 0.2580847974481608,
|
| 136 |
+
"rougeL": 0.32541870004323864
|
| 137 |
+
},
|
| 138 |
+
{
|
| 139 |
+
"name": "tr-wikihow-summ",
|
| 140 |
+
"task": "summarization",
|
| 141 |
+
"rouge1": 0.2444219472309469,
|
| 142 |
+
"rouge2": 0.07918689923056912,
|
| 143 |
+
"rougeL": 0.1723711997990579
|
| 144 |
},
|
| 145 |
{
|
| 146 |
"name": "wiki_lingua_tr",
|
| 147 |
"task": "summarization",
|
| 148 |
+
"rouge1": 0.22962802442673436,
|
| 149 |
+
"rouge2": 0.07863769381205138,
|
| 150 |
+
"rougeL": 0.16924353815052512
|
| 151 |
},
|
| 152 |
{
|
| 153 |
"name": "wmt-tr-en-prompt",
|
| 154 |
"task": "machine_translation",
|
| 155 |
+
"wer": 0.7815049287082738,
|
| 156 |
+
"bleu": 0.1564145890661644
|
| 157 |
},
|
| 158 |
{
|
| 159 |
"name": "xlsum_tr",
|
| 160 |
"task": "summarization",
|
| 161 |
+
"rouge1": 0.2805962791068744,
|
| 162 |
+
"rouge2": 0.12421139697660691,
|
| 163 |
+
"rougeL": 0.21080710839195932
|
| 164 |
}
|
| 165 |
]
|
| 166 |
}
|
results/zero-shot/llama-3.1-8b.json
CHANGED
|
@@ -122,6 +122,45 @@
|
|
| 122 |
"task": "extractive_question_answering",
|
| 123 |
"exact_match": 0.2092436974789916,
|
| 124 |
"f1": 0.35674599908781446
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 125 |
}
|
| 126 |
]
|
| 127 |
}
|
|
|
|
| 122 |
"task": "extractive_question_answering",
|
| 123 |
"exact_match": 0.2092436974789916,
|
| 124 |
"f1": 0.35674599908781446
|
| 125 |
+
},
|
| 126 |
+
{
|
| 127 |
+
"name": "gecturk_generation",
|
| 128 |
+
"task": "grammatical_error_correction",
|
| 129 |
+
"exact_match": 0.006548220906158217
|
| 130 |
+
},
|
| 131 |
+
{
|
| 132 |
+
"name": "mlsum_tr",
|
| 133 |
+
"task": "summarization",
|
| 134 |
+
"rouge1": 0.3970732593089523,
|
| 135 |
+
"rouge2": 0.2580847974481608,
|
| 136 |
+
"rougeL": 0.32541870004323864
|
| 137 |
+
},
|
| 138 |
+
{
|
| 139 |
+
"name": "tr-wikihow-summ",
|
| 140 |
+
"task": "summarization",
|
| 141 |
+
"rouge1": 0.2444219472309469,
|
| 142 |
+
"rouge2": 0.07918689923056912,
|
| 143 |
+
"rougeL": 0.1723711997990579
|
| 144 |
+
},
|
| 145 |
+
{
|
| 146 |
+
"name": "wiki_lingua_tr",
|
| 147 |
+
"task": "summarization",
|
| 148 |
+
"rouge1": 0.22962802442673436,
|
| 149 |
+
"rouge2": 0.07863769381205138,
|
| 150 |
+
"rougeL": 0.16924353815052512
|
| 151 |
+
},
|
| 152 |
+
{
|
| 153 |
+
"name": "wmt-tr-en-prompt",
|
| 154 |
+
"task": "machine_translation",
|
| 155 |
+
"wer": 0.7815049287082738,
|
| 156 |
+
"bleu": 0.1564145890661644
|
| 157 |
+
},
|
| 158 |
+
{
|
| 159 |
+
"name": "xlsum_tr",
|
| 160 |
+
"task": "summarization",
|
| 161 |
+
"rouge1": 0.2805962791068744,
|
| 162 |
+
"rouge2": 0.12421139697660691,
|
| 163 |
+
"rougeL": 0.21080710839195932
|
| 164 |
}
|
| 165 |
]
|
| 166 |
}
|