openhands openhands committed on
Commit
dd11f84
·
1 Parent(s): 9b84cf0

Fix runtime columns not appearing in table and scatter plots

Browse files

- Add runtime columns to DataTransformer.view() output:
  - Add primary_runtime_col ("Average Runtime" for Overall, "{Category} Runtime" otherwise)
  - Include runtime columns for each category/benchmark in metrics_to_display

This fixes the issue where runtime data was loaded correctly but wasn't being
passed through to the display table and scatter plots.

Co-authored-by: openhands <openhands@all-hands.dev>

Files changed (1) hide show
  1. leaderboard_transformer.py +5 -2
leaderboard_transformer.py CHANGED
@@ -318,16 +318,19 @@ class DataTransformer:
318
  new_cols = ["Openness"]
319
  ending_cols = ["Date", "Logs"]
320
 
321
- # For Overall view, use "Average Cost" (average cost per instance across all benchmarks)
322
  if tag is None or tag == "Overall":
323
  primary_cost_col = "Average Cost"
 
324
  else:
325
  primary_cost_col = f"{primary_metric} Cost"
 
326
 
327
- metrics_to_display = [primary_score_col, primary_cost_col]
328
  for item in group_metrics:
329
  metrics_to_display.append(f"{item} Score")
330
  metrics_to_display.append(f"{item} Cost")
 
331
 
332
  final_cols_ordered = new_cols + base_cols + list(dict.fromkeys(metrics_to_display)) + ending_cols
333
 
 
318
  new_cols = ["Openness"]
319
  ending_cols = ["Date", "Logs"]
320
 
321
+ # For Overall view, use "Average Cost" and "Average Runtime" (per instance across all benchmarks)
322
  if tag is None or tag == "Overall":
323
  primary_cost_col = "Average Cost"
324
+ primary_runtime_col = "Average Runtime"
325
  else:
326
  primary_cost_col = f"{primary_metric} Cost"
327
+ primary_runtime_col = f"{primary_metric} Runtime"
328
 
329
+ metrics_to_display = [primary_score_col, primary_cost_col, primary_runtime_col]
330
  for item in group_metrics:
331
  metrics_to_display.append(f"{item} Score")
332
  metrics_to_display.append(f"{item} Cost")
333
+ metrics_to_display.append(f"{item} Runtime")
334
 
335
  final_cols_ordered = new_cols + base_cols + list(dict.fromkeys(metrics_to_display)) + ending_cols
336