danielrosehill committed on
Commit
7265315
·
1 Parent(s): 2e5e23f

Deduplicate leaderboard entries

Browse files
Files changed (1) hide show
  1. app.py +3 -0
app.py CHANGED
@@ -45,6 +45,8 @@ def create_leaderboard_df(benchmark_data):
45
  rows.append(row)
46
 
47
  df = pd.DataFrame(rows)
 
 
48
  # Sort by WER (lower is better)
49
  df = df.sort_values("WER (%)", ascending=True)
50
  return df
@@ -65,6 +67,7 @@ def create_punctuation_df(punct_data):
65
  rows.append(row)
66
 
67
  df = pd.DataFrame(rows)
 
68
  # Sort by overall score (higher is better)
69
  df = df.sort_values("Overall Score (%)", ascending=False)
70
  return df
 
45
  rows.append(row)
46
 
47
  df = pd.DataFrame(rows)
48
+ # Remove duplicate model/provider entries so each model shows once in the charts
49
+ df = df.drop_duplicates(subset=["Provider", "Model", "Type"], keep="first")
50
  # Sort by WER (lower is better)
51
  df = df.sort_values("WER (%)", ascending=True)
52
  return df
 
67
  rows.append(row)
68
 
69
  df = pd.DataFrame(rows)
70
+ df = df.drop_duplicates(subset=["Provider", "Model"], keep="first")
71
  # Sort by overall score (higher is better)
72
  df = df.sort_values("Overall Score (%)", ascending=False)
73
  return df