Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
|
@@ -161,9 +161,9 @@ def add_new_eval(
 )
 
 accuracy = float("{:.1f}".format(np.average([x["score"] for x in all_scores]) * 100))
-coverage = float("{:.1f}".format(np.average([x["has_ans"] for x in all_scores])))
-em = float("{:.1f}".format(np.average([1 if x["score"] == 1 else 0 for x in all_scores])))
-precision = float("{:.1f}".format(np.average([x["score"] for x in all_scores if x["has_ans"] == 1])))
+coverage = float("{:.1f}".format(np.average([x["has_ans"] for x in all_scores]) * 100))
+em = float("{:.1f}".format(np.average([1 if x["score"] == 1 else 0 for x in all_scores]) * 100))
+precision = float("{:.1f}".format(np.average([x["score"] for x in all_scores if x["has_ans"] == 1]) * 100))
 
 eval_entry = {
 "Model Name": model_name,