Spaces:
Sleeping
Sleeping
Data page
Browse files- app/backend/data_engine.py +16 -2
app/backend/data_engine.py
CHANGED
|
@@ -113,6 +113,15 @@ class DataEngine:
|
|
| 113 |
for _, row in grouped_dataset_count.iterrows():
|
| 114 |
dataset_num_map[row["group_name"]] = row["dataset_name"]
|
| 115 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 116 |
grouped_model = df.groupby(["model_name", "group_name"]).agg({
|
| 117 |
"ndcg_at_10": "mean",
|
| 118 |
}).reset_index()
|
|
@@ -121,13 +130,18 @@ class DataEngine:
|
|
| 121 |
|
| 122 |
# Rename columns
|
| 123 |
pivot.columns = list(
|
| 124 |
-
map(lambda x: f"{x[1].capitalize()} Average ({dataset_num_map[x[1]]} datasets)" if x[
|
| 125 |
-
1] != 'text' else f"Average ({dataset_num_map[x[1]]} datasets)",
|
| 126 |
pivot.columns))
|
| 127 |
|
| 128 |
pivot_dataset = df_result.pivot(index="model_name", columns="dataset_name", values="ndcg_at_10")
|
| 129 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 130 |
df = pd.merge(df_model, pivot, on="model_name")
|
|
|
|
| 131 |
df = pd.merge(df, pivot_dataset, on="model_name")
|
| 132 |
|
| 133 |
if df.empty:
|
|
|
|
| 113 |
for _, row in grouped_dataset_count.iterrows():
|
| 114 |
dataset_num_map[row["group_name"]] = row["dataset_name"]
|
| 115 |
|
| 116 |
+
# Create a list of open datasets
|
| 117 |
+
open_datasets = []
|
| 118 |
+
for result in results_list:
|
| 119 |
+
if not result.get("is_closed", False):
|
| 120 |
+
open_datasets.append(result["dataset_name"])
|
| 121 |
+
|
| 122 |
+
# Count open datasets
|
| 123 |
+
open_dataset_count = len(open_datasets)
|
| 124 |
+
|
| 125 |
grouped_model = df.groupby(["model_name", "group_name"]).agg({
|
| 126 |
"ndcg_at_10": "mean",
|
| 127 |
}).reset_index()
|
|
|
|
| 130 |
|
| 131 |
# Rename columns
|
| 132 |
pivot.columns = list(
|
| 133 |
+
map(lambda x: f"{x[1].capitalize()} Average ({dataset_num_map[x[1]]} datasets)" if x[1] != 'text' else f"Average ({dataset_num_map[x[1]]} datasets)",
|
|
|
|
| 134 |
pivot.columns))
|
| 135 |
|
| 136 |
pivot_dataset = df_result.pivot(index="model_name", columns="dataset_name", values="ndcg_at_10")
|
| 137 |
|
| 138 |
+
# Calculate open average
|
| 139 |
+
open_df = df_result[df_result["dataset_name"].isin(open_datasets)]
|
| 140 |
+
open_avg = open_df.groupby("model_name")["ndcg_at_10"].mean().reset_index()
|
| 141 |
+
open_avg = open_avg.rename(columns={"ndcg_at_10": f"Open average ({open_dataset_count} datasets)"})
|
| 142 |
+
|
| 143 |
df = pd.merge(df_model, pivot, on="model_name")
|
| 144 |
+
df = pd.merge(df, open_avg, on="model_name")
|
| 145 |
df = pd.merge(df, pivot_dataset, on="model_name")
|
| 146 |
|
| 147 |
if df.empty:
|