Spaces:
Runtime error
Runtime error
jasonshaoshun committed on
Commit ·
55ba7bd
1
Parent(s): eaedb33
debug
Browse files
- src/leaderboard/read_evals.py +26 -10
src/leaderboard/read_evals.py
CHANGED
|
@@ -286,10 +286,30 @@ class EvalResult_MIB_CAUSALGRAPH:
|
|
| 286 |
|
| 287 |
# return data_dict
|
| 288 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 289 |
def to_dict(self):
|
| 290 |
"""Converts the Eval Result to a dict for dataframe display"""
|
| 291 |
-
print(f"Results in to_dict: {self.results}") # Debug print
|
| 292 |
-
|
| 293 |
data_dict = {
|
| 294 |
"eval_name": self.eval_name,
|
| 295 |
"Method": self.method_name,
|
|
@@ -298,14 +318,10 @@ class EvalResult_MIB_CAUSALGRAPH:
|
|
| 298 |
# Process each model's results
|
| 299 |
for model_id, scores in self.results.items():
|
| 300 |
model_name = model_id.lower()
|
| 301 |
-
|
| 302 |
-
|
| 303 |
-
|
| 304 |
-
|
| 305 |
-
|
| 306 |
-
for intervention_data in intervention_scores:
|
| 307 |
-
col_name = f"{model_name}_layer{layer}_{intervention_data['intervention']}".lower()
|
| 308 |
-
data_dict[col_name] = intervention_data['score']
|
| 309 |
|
| 310 |
return data_dict
|
| 311 |
|
|
|
|
| 286 |
|
| 287 |
# return data_dict
|
| 288 |
|
| 289 |
+
# def to_dict(self):
|
| 290 |
+
# """Converts the Eval Result to a dict for dataframe display"""
|
| 291 |
+
# print(f"Results in to_dict: {self.results}") # Debug print
|
| 292 |
+
|
| 293 |
+
# data_dict = {
|
| 294 |
+
# "eval_name": self.eval_name,
|
| 295 |
+
# "Method": self.method_name,
|
| 296 |
+
# }
|
| 297 |
+
|
| 298 |
+
# # Process each model's results
|
| 299 |
+
# for model_id, scores in self.results.items():
|
| 300 |
+
# model_name = model_id.lower()
|
| 301 |
+
# for task, layer_scores in scores.items():
|
| 302 |
+
# for layer_data in layer_scores:
|
| 303 |
+
# layer = layer_data.get("layer")
|
| 304 |
+
# intervention_scores = layer_data.get("scores", [])
|
| 305 |
+
|
| 306 |
+
# for intervention_data in intervention_scores:
|
| 307 |
+
# col_name = f"{model_name}_layer{layer}_{intervention_data['intervention']}".lower()
|
| 308 |
+
# data_dict[col_name] = intervention_data['score']
|
| 309 |
+
|
| 310 |
+
# return data_dict
|
| 311 |
def to_dict(self):
|
| 312 |
"""Converts the Eval Result to a dict for dataframe display"""
|
|
|
|
|
|
|
| 313 |
data_dict = {
|
| 314 |
"eval_name": self.eval_name,
|
| 315 |
"Method": self.method_name,
|
|
|
|
| 318 |
# Process each model's results
|
| 319 |
for model_id, scores in self.results.items():
|
| 320 |
model_name = model_id.lower()
|
| 321 |
+
# The scores are already in the format we want
|
| 322 |
+
for key, value in scores.items():
|
| 323 |
+
col_name = f"{model_name}_{key}"
|
| 324 |
+
data_dict[col_name] = value
|
|
|
|
|
|
|
|
|
|
|
|
|
| 325 |
|
| 326 |
return data_dict
|
| 327 |
|