Spaces:
Sleeping
Sleeping
Commit ·
bc83a77
1
Parent(s): 6c6a1f3
add thinks
Browse files
about.py
CHANGED
|
@@ -41,5 +41,6 @@ METRIC_INFO_TEXT = """
|
|
| 41 |
|
| 42 |
- **Meter** - How closely the model sticks to the meter of the lines.
|
| 43 |
- **Verse** - How closely the model aligns the lines to the verse and chorus breakup.
|
| 44 |
-
- **Focus** - How much of the response is extraneous commentary instead of the song. Focus in particular has a very minor contribution to the final score
|
|
|
|
| 45 |
"""
|
|
|
|
| 41 |
|
| 42 |
- **Meter** - How closely the model sticks to the meter of the lines.
|
| 43 |
- **Verse** - How closely the model aligns the lines to the verse and chorus breakup.
|
| 44 |
+
- **Focus** - How much of the response is extraneous commentary instead of the song. *(Focus in particular has a very minor contribution to the final score)*
|
| 45 |
+
- **Thinking** - The **averaged** number of thinking tokens per response. Zero means it's not a reasoning model.
|
| 46 |
"""
|
utils.py
CHANGED
|
@@ -68,6 +68,7 @@ def load_leaderboard() -> pd.DataFrame:
|
|
| 68 |
"meter_score": "Meter",
|
| 69 |
"verse_score": "Verse",
|
| 70 |
"focus_score": "Focus",
|
|
|
|
| 71 |
"evaluated_at": "Evaluated At",
|
| 72 |
}
|
| 73 |
display_cols = [c for c in col_map if c in df.columns]
|
|
@@ -116,12 +117,9 @@ def load_leaderboard() -> pd.DataFrame:
|
|
| 116 |
"Meter": "{:.1%}",
|
| 117 |
"Verse": "{:.1%}",
|
| 118 |
"Focus": "{:.1%}",
|
|
|
|
| 119 |
})
|
| 120 |
.hide(axis="index")
|
| 121 |
-
.set_table_styles([
|
| 122 |
-
dict(selector='th', props=[('text-align', 'center')]),
|
| 123 |
-
dict(selector='td', props=[('text-align', 'center')]),
|
| 124 |
-
])
|
| 125 |
)
|
| 126 |
|
| 127 |
return styled
|
|
@@ -140,6 +138,7 @@ def empty_leaderboard() -> pd.DataFrame:
|
|
| 140 |
"Meter",
|
| 141 |
"Verse",
|
| 142 |
"Focus",
|
|
|
|
| 143 |
"Evaluated At",
|
| 144 |
]
|
| 145 |
)
|
|
|
|
| 68 |
"meter_score": "Meter",
|
| 69 |
"verse_score": "Verse",
|
| 70 |
"focus_score": "Focus",
|
| 71 |
+
"avg_think_tokens": "Thinking",
|
| 72 |
"evaluated_at": "Evaluated At",
|
| 73 |
}
|
| 74 |
display_cols = [c for c in col_map if c in df.columns]
|
|
|
|
| 117 |
"Meter": "{:.1%}",
|
| 118 |
"Verse": "{:.1%}",
|
| 119 |
"Focus": "{:.1%}",
|
| 120 |
+
"Thinking": "{:0.0f}",
|
| 121 |
})
|
| 122 |
.hide(axis="index")
|
|
|
|
|
|
|
|
|
|
|
|
|
| 123 |
)
|
| 124 |
|
| 125 |
return styled
|
|
|
|
| 138 |
"Meter",
|
| 139 |
"Verse",
|
| 140 |
"Focus",
|
| 141 |
+
"Thinking",
|
| 142 |
"Evaluated At",
|
| 143 |
]
|
| 144 |
)
|