# Ray0202
# update leaderboard
# 1dd52d9
from __future__ import annotations
from dataclasses import dataclass
@dataclass(frozen=True)
class TemporalBenchSchema:
    """Immutable grouping of the field names that make up a TemporalBench record.

    The schema is split into three tuples of string keys: identity fields,
    required metrics and optional metrics. Every field has a default, so
    ``TemporalBenchSchema()`` yields the canonical schema; because the
    dataclass is frozen, attributes cannot be reassigned after construction.

    NOTE(review): how consumers enforce "required" versus "optional" is not
    visible in this file -- confirm against the code that validates records.
    """

    # Keys that identify an entry rather than score it.
    identity_fields: tuple[str, ...] = (
        "agent_name",
        "agent_type",
        "base_model",
    )

    # One accuracy key per task, T1 through T4.
    required_metrics: tuple[str, ...] = (
        "T1_acc",
        "T2_acc",
        "T3_acc",
        "T4_acc",
    )

    optional_metrics: tuple[str, ...] = (
        # Aggregate keys (no dataset prefix).
        "overall_mcq_acc",
        "T2_sMAPE",
        "T2_MAE",
        "T2_OW_sMAPE_MIMIC",
        "T2_OW_RMSSE_MIMIC",
        "T4_sMAPE",
        "T4_MAE",
        "T4_OW_sMAPE_MIMIC",
        "T4_OW_RMSSE_MIMIC",
        # Per-prefix accuracy keys, "<prefix>_T{1..4}_acc"
        # (prefixes are presumably dataset names -- TODO confirm).
        "FreshRetailNet_T1_acc",
        "FreshRetailNet_T2_acc",
        "FreshRetailNet_T3_acc",
        "FreshRetailNet_T4_acc",
        "PSML_T1_acc",
        "PSML_T2_acc",
        "PSML_T3_acc",
        "PSML_T4_acc",
        "CausalChambers_T1_acc",
        "CausalChambers_T2_acc",
        "CausalChambers_T3_acc",
        "CausalChambers_T4_acc",
        "MIMIC_T1_acc",
        "MIMIC_T2_acc",
        "MIMIC_T3_acc",
        "MIMIC_T4_acc",
        # Per-prefix T2 error keys; the MIMIC prefix uses the OW_sMAPE /
        # OW_RMSSE pair where the other prefixes use sMAPE / MAE.
        "FreshRetailNet_T2_sMAPE",
        "FreshRetailNet_T2_MAE",
        "PSML_T2_sMAPE",
        "PSML_T2_MAE",
        "CausalChambers_T2_sMAPE",
        "CausalChambers_T2_MAE",
        "MIMIC_T2_OW_sMAPE",
        "MIMIC_T2_OW_RMSSE",
        # Per-prefix T4 error keys, same layout as the T2 group above.
        "FreshRetailNet_T4_sMAPE",
        "FreshRetailNet_T4_MAE",
        "PSML_T4_sMAPE",
        "PSML_T4_MAE",
        "CausalChambers_T4_sMAPE",
        "CausalChambers_T4_MAE",
        "MIMIC_T4_OW_sMAPE",
        "MIMIC_T4_OW_RMSSE",
    )
# Module-level schema instance built entirely from the dataclass defaults.
SCHEMA = TemporalBenchSchema()