Spaces: Running on CPU Upgrade
fewshot_as_multiturn
Browse files
src/leaderboard/read_evals.py CHANGED
|
@@ -47,6 +47,7 @@ class EvalResult:
|
|
| 47 |
n_shot = data.get("n-shot")
|
| 48 |
start_date = data.get("date", 0)
|
| 49 |
chat_template = data.get("chat_template", None)
|
|
|
|
| 50 |
|
| 51 |
# Precision
|
| 52 |
precision = Precision.from_str(config.get("model_dtype"))
|
|
@@ -78,6 +79,8 @@ class EvalResult:
|
|
| 78 |
|
| 79 |
if chat_template:
|
| 80 |
org_and_model += ",chat"
|
|
|
|
|
|
|
| 81 |
|
| 82 |
org_and_model = org_and_model.split("/", 1)
|
| 83 |
|
|
|
|
| 47 |
n_shot = data.get("n-shot")
|
| 48 |
start_date = data.get("date", 0)
|
| 49 |
chat_template = data.get("chat_template", None)
|
| 50 |
+
fewshot_as_multiturn = data.get("fewshot_as_multiturn", True)
|
| 51 |
|
| 52 |
# Precision
|
| 53 |
precision = Precision.from_str(config.get("model_dtype"))
|
|
|
|
| 79 |
|
| 80 |
if chat_template:
|
| 81 |
org_and_model += ",chat"
|
| 82 |
+
if not fewshot_as_multiturn:
|
| 83 |
+
org_and_model += ",no-multiturn"
|
| 84 |
|
| 85 |
org_and_model = org_and_model.split("/", 1)
|
| 86 |
|