dror44 committed on
Commit
f663644
·
1 Parent(s): d590c57

fix confidences

Browse files
Files changed (1) hide show
  1. src/app.py +15 -2
src/app.py CHANGED
@@ -17,6 +17,19 @@ selected_judges: list = []
17
  current_test_type: str = "grounding"
18
 
19
 
 
 
 
 
 
 
 
 
 
 
 
 
 
20
  def initialize():
21
  """Initialize the application."""
22
  # Load models from file
@@ -68,8 +81,8 @@ def initialize():
68
  winner2_fn=lambda: select_winner("Evaluation 2", judge_manager),
69
  both_correct_fn=lambda: handle_both_correct(judge_manager),
70
  both_incorrect_fn=lambda: handle_both_incorrect(judge_manager),
71
- refresh_leaderboard_fn=lambda: judge_manager.leaderboard_df,
72
- leaderboard_df=judge_manager.leaderboard_df,
73
  )
74
 
75
  return ui.create_interface()
 
17
  current_test_type: str = "grounding"
18
 
19
 
20
def format_leaderboard_for_display(df: pd.DataFrame) -> pd.DataFrame:
    """Format the leaderboard dataframe for display in the UI.

    Selects the leaderboard columns that are shown to users and renames
    them to human-readable headers, so the table is displayed consistently
    across environments such as Hugging Face Spaces.

    Args:
        df: Leaderboard data containing at least the columns
            ``judge_name``, ``elo_score``, ``wins``, ``losses`` and
            ``total_evaluations``. Any other columns are ignored.

    Returns:
        A new dataframe with the columns ``Judge Name``, ``ELO Score``,
        ``Wins``, ``Losses`` and ``Total Evaluations`` (in that order),
        keeping the row index of ``df``. The input dataframe is not
        modified.

    Raises:
        KeyError: If any of the required columns is missing from ``df``.
    """
    # Source column -> header shown in the UI; dict order fixes the
    # left-to-right column order of the displayed table.
    display_names = {
        "judge_name": "Judge Name",
        "elo_score": "ELO Score",
        "wins": "Wins",
        "losses": "Losses",
        "total_evaluations": "Total Evaluations",
    }

    # Report every missing column at once instead of failing on the first.
    missing = [column for column in display_names if column not in df.columns]
    if missing:
        raise KeyError(f"leaderboard is missing required column(s): {missing}")

    return df[list(display_names)].rename(columns=display_names)
31
+
32
+
33
  def initialize():
34
  """Initialize the application."""
35
  # Load models from file
 
81
  winner2_fn=lambda: select_winner("Evaluation 2", judge_manager),
82
  both_correct_fn=lambda: handle_both_correct(judge_manager),
83
  both_incorrect_fn=lambda: handle_both_incorrect(judge_manager),
84
+ refresh_leaderboard_fn=lambda: format_leaderboard_for_display(judge_manager.leaderboard_df),
85
+ leaderboard_df=format_leaderboard_for_display(judge_manager.leaderboard_df),
86
  )
87
 
88
  return ui.create_interface()