Spaces:
Running
Running
openhands openhands committed on
Commit ·
dd11f84
1
Parent(s): 9b84cf0
Fix runtime columns not appearing in table and scatter plots
Browse files
- Add runtime columns to DataTransformer.view() output:
  - Add primary_runtime_col (Average Runtime for Overall, {Category} Runtime otherwise)
  - Include runtime columns for each category/benchmark in metrics_to_display

This fixes the issue where runtime data was loaded correctly but wasn't being
passed through to the display table and scatter plots.
Co-authored-by: openhands <openhands@all-hands.dev>
leaderboard_transformer.py
CHANGED
|
@@ -318,16 +318,19 @@ class DataTransformer:
|
|
| 318 |
new_cols = ["Openness"]
|
| 319 |
ending_cols = ["Date", "Logs"]
|
| 320 |
|
| 321 |
-
# For Overall view, use "Average Cost"
|
| 322 |
if tag is None or tag == "Overall":
|
| 323 |
primary_cost_col = "Average Cost"
|
|
|
|
| 324 |
else:
|
| 325 |
primary_cost_col = f"{primary_metric} Cost"
|
|
|
|
| 326 |
|
| 327 |
-
metrics_to_display = [primary_score_col, primary_cost_col]
|
| 328 |
for item in group_metrics:
|
| 329 |
metrics_to_display.append(f"{item} Score")
|
| 330 |
metrics_to_display.append(f"{item} Cost")
|
|
|
|
| 331 |
|
| 332 |
final_cols_ordered = new_cols + base_cols + list(dict.fromkeys(metrics_to_display)) + ending_cols
|
| 333 |
|
|
|
|
| 318 |
new_cols = ["Openness"]
|
| 319 |
ending_cols = ["Date", "Logs"]
|
| 320 |
|
| 321 |
+
# For Overall view, use "Average Cost" and "Average Runtime" (per instance across all benchmarks)
|
| 322 |
if tag is None or tag == "Overall":
|
| 323 |
primary_cost_col = "Average Cost"
|
| 324 |
+
primary_runtime_col = "Average Runtime"
|
| 325 |
else:
|
| 326 |
primary_cost_col = f"{primary_metric} Cost"
|
| 327 |
+
primary_runtime_col = f"{primary_metric} Runtime"
|
| 328 |
|
| 329 |
+
metrics_to_display = [primary_score_col, primary_cost_col, primary_runtime_col]
|
| 330 |
for item in group_metrics:
|
| 331 |
metrics_to_display.append(f"{item} Score")
|
| 332 |
metrics_to_display.append(f"{item} Cost")
|
| 333 |
+
metrics_to_display.append(f"{item} Runtime")
|
| 334 |
|
| 335 |
final_cols_ordered = new_cols + base_cols + list(dict.fromkeys(metrics_to_display)) + ending_cols
|
| 336 |
|