warlockee's picture
Upload folder using huggingface_hub
bd3ae0e verified
{
"n_splits": 20,
"n_smac": 569,
"n_llm": 195,
"results": [
{
"split": 0,
"policy": "SMAC",
"selector": "train_val_ap",
"deploy_eval_ap": 0.4570224663107674,
"top5_eval_ap": 0.554324263047066,
"oracle_eval_ap": 0.6992517338762682
},
{
"split": 0,
"policy": "SMAC",
"selector": "proxy_ap",
"deploy_eval_ap": 0.6701524418076312,
"top5_eval_ap": 0.686699506702746,
"oracle_eval_ap": 0.6992517338762682
},
{
"split": 0,
"policy": "SMAC",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.6721980222170849,
"top5_eval_ap": 0.6792901260791705,
"oracle_eval_ap": 0.6992517338762682
},
{
"split": 0,
"policy": "SMAC",
"selector": "proxy_brier",
"deploy_eval_ap": 0.6721980222170849,
"top5_eval_ap": 0.6792901260791705,
"oracle_eval_ap": 0.6992517338762682
},
{
"split": 0,
"policy": "SMAC",
"selector": "proxy_auc",
"deploy_eval_ap": 0.6792901260791705,
"top5_eval_ap": 0.6792901260791705,
"oracle_eval_ap": 0.6992517338762682
},
{
"split": 0,
"policy": "LLM",
"selector": "train_val_ap",
"deploy_eval_ap": 0.5233387623389887,
"top5_eval_ap": 0.5367247333545382,
"oracle_eval_ap": 0.5821468830123655
},
{
"split": 0,
"policy": "LLM",
"selector": "proxy_ap",
"deploy_eval_ap": 0.5710383254419367,
"top5_eval_ap": 0.5821468830123655,
"oracle_eval_ap": 0.5821468830123655
},
{
"split": 0,
"policy": "LLM",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.5246631981230342,
"top5_eval_ap": 0.5710383254419367,
"oracle_eval_ap": 0.5821468830123655
},
{
"split": 0,
"policy": "LLM",
"selector": "proxy_brier",
"deploy_eval_ap": 0.5710383254419367,
"top5_eval_ap": 0.5710383254419367,
"oracle_eval_ap": 0.5821468830123655
},
{
"split": 0,
"policy": "LLM",
"selector": "proxy_auc",
"deploy_eval_ap": 0.5821468830123655,
"top5_eval_ap": 0.5821468830123655,
"oracle_eval_ap": 0.5821468830123655
},
{
"split": 1,
"policy": "SMAC",
"selector": "train_val_ap",
"deploy_eval_ap": 0.46441448049443035,
"top5_eval_ap": 0.5270217679633087,
"oracle_eval_ap": 0.6763881841332537
},
{
"split": 1,
"policy": "SMAC",
"selector": "proxy_ap",
"deploy_eval_ap": 0.6373692361609227,
"top5_eval_ap": 0.6574063977544806,
"oracle_eval_ap": 0.6763881841332537
},
{
"split": 1,
"policy": "SMAC",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.6412953703595898,
"top5_eval_ap": 0.659747880337521,
"oracle_eval_ap": 0.6763881841332537
},
{
"split": 1,
"policy": "SMAC",
"selector": "proxy_brier",
"deploy_eval_ap": 0.659747880337521,
"top5_eval_ap": 0.659747880337521,
"oracle_eval_ap": 0.6763881841332537
},
{
"split": 1,
"policy": "SMAC",
"selector": "proxy_auc",
"deploy_eval_ap": 0.6549798755291265,
"top5_eval_ap": 0.659747880337521,
"oracle_eval_ap": 0.6763881841332537
},
{
"split": 1,
"policy": "LLM",
"selector": "train_val_ap",
"deploy_eval_ap": 0.5122126575807857,
"top5_eval_ap": 0.5309389698647801,
"oracle_eval_ap": 0.5676444796768093
},
{
"split": 1,
"policy": "LLM",
"selector": "proxy_ap",
"deploy_eval_ap": 0.5639179338971837,
"top5_eval_ap": 0.5676444796768093,
"oracle_eval_ap": 0.5676444796768093
},
{
"split": 1,
"policy": "LLM",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.5192059594256696,
"top5_eval_ap": 0.5639179338971837,
"oracle_eval_ap": 0.5676444796768093
},
{
"split": 1,
"policy": "LLM",
"selector": "proxy_brier",
"deploy_eval_ap": 0.5192059594256696,
"top5_eval_ap": 0.5639179338971837,
"oracle_eval_ap": 0.5676444796768093
},
{
"split": 1,
"policy": "LLM",
"selector": "proxy_auc",
"deploy_eval_ap": 0.5676444796768093,
"top5_eval_ap": 0.5676444796768093,
"oracle_eval_ap": 0.5676444796768093
},
{
"split": 2,
"policy": "SMAC",
"selector": "train_val_ap",
"deploy_eval_ap": 0.48153527880634006,
"top5_eval_ap": 0.583935038683602,
"oracle_eval_ap": 0.6990313570985696
},
{
"split": 2,
"policy": "SMAC",
"selector": "proxy_ap",
"deploy_eval_ap": 0.6623016702621187,
"top5_eval_ap": 0.6975191425541587,
"oracle_eval_ap": 0.6990313570985696
},
{
"split": 2,
"policy": "SMAC",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.6623016702621187,
"top5_eval_ap": 0.6668939043306413,
"oracle_eval_ap": 0.6990313570985696
},
{
"split": 2,
"policy": "SMAC",
"selector": "proxy_brier",
"deploy_eval_ap": 0.6623016702621187,
"top5_eval_ap": 0.6765853983546597,
"oracle_eval_ap": 0.6990313570985696
},
{
"split": 2,
"policy": "SMAC",
"selector": "proxy_auc",
"deploy_eval_ap": 0.6623016702621187,
"top5_eval_ap": 0.6872781185782315,
"oracle_eval_ap": 0.6990313570985696
},
{
"split": 2,
"policy": "LLM",
"selector": "train_val_ap",
"deploy_eval_ap": 0.5716335781219793,
"top5_eval_ap": 0.5924666754414817,
"oracle_eval_ap": 0.6303368424328526
},
{
"split": 2,
"policy": "LLM",
"selector": "proxy_ap",
"deploy_eval_ap": 0.6197933838977654,
"top5_eval_ap": 0.6303368424328526,
"oracle_eval_ap": 0.6303368424328526
},
{
"split": 2,
"policy": "LLM",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.5595467532159494,
"top5_eval_ap": 0.6303368424328526,
"oracle_eval_ap": 0.6303368424328526
},
{
"split": 2,
"policy": "LLM",
"selector": "proxy_brier",
"deploy_eval_ap": 0.5595467532159494,
"top5_eval_ap": 0.6303368424328526,
"oracle_eval_ap": 0.6303368424328526
},
{
"split": 2,
"policy": "LLM",
"selector": "proxy_auc",
"deploy_eval_ap": 0.5939967909066806,
"top5_eval_ap": 0.6197933838977654,
"oracle_eval_ap": 0.6303368424328526
},
{
"split": 3,
"policy": "SMAC",
"selector": "train_val_ap",
"deploy_eval_ap": 0.47686687736181266,
"top5_eval_ap": 0.5533094784532413,
"oracle_eval_ap": 0.699491642922994
},
{
"split": 3,
"policy": "SMAC",
"selector": "proxy_ap",
"deploy_eval_ap": 0.6670702453072503,
"top5_eval_ap": 0.6845344993452391,
"oracle_eval_ap": 0.699491642922994
},
{
"split": 3,
"policy": "SMAC",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.676851998605726,
"top5_eval_ap": 0.6973621765945375,
"oracle_eval_ap": 0.699491642922994
},
{
"split": 3,
"policy": "SMAC",
"selector": "proxy_brier",
"deploy_eval_ap": 0.676851998605726,
"top5_eval_ap": 0.6973621765945375,
"oracle_eval_ap": 0.699491642922994
},
{
"split": 3,
"policy": "SMAC",
"selector": "proxy_auc",
"deploy_eval_ap": 0.6973621765945375,
"top5_eval_ap": 0.6973621765945375,
"oracle_eval_ap": 0.699491642922994
},
{
"split": 3,
"policy": "LLM",
"selector": "train_val_ap",
"deploy_eval_ap": 0.5450044403166794,
"top5_eval_ap": 0.5532931874364065,
"oracle_eval_ap": 0.6134983686209221
},
{
"split": 3,
"policy": "LLM",
"selector": "proxy_ap",
"deploy_eval_ap": 0.5865040038295037,
"top5_eval_ap": 0.5865040038295037,
"oracle_eval_ap": 0.6134983686209221
},
{
"split": 3,
"policy": "LLM",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.5865040038295037,
"top5_eval_ap": 0.5865040038295037,
"oracle_eval_ap": 0.6134983686209221
},
{
"split": 3,
"policy": "LLM",
"selector": "proxy_brier",
"deploy_eval_ap": 0.5865040038295037,
"top5_eval_ap": 0.5865040038295037,
"oracle_eval_ap": 0.6134983686209221
},
{
"split": 3,
"policy": "LLM",
"selector": "proxy_auc",
"deploy_eval_ap": 0.5865040038295037,
"top5_eval_ap": 0.6134983686209221,
"oracle_eval_ap": 0.6134983686209221
},
{
"split": 4,
"policy": "SMAC",
"selector": "train_val_ap",
"deploy_eval_ap": 0.48965935913922864,
"top5_eval_ap": 0.5659805254448687,
"oracle_eval_ap": 0.6665470019333972
},
{
"split": 4,
"policy": "SMAC",
"selector": "proxy_ap",
"deploy_eval_ap": 0.6458410401680073,
"top5_eval_ap": 0.6538475606777989,
"oracle_eval_ap": 0.6665470019333972
},
{
"split": 4,
"policy": "SMAC",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.6458410401680073,
"top5_eval_ap": 0.6514671952126687,
"oracle_eval_ap": 0.6665470019333972
},
{
"split": 4,
"policy": "SMAC",
"selector": "proxy_brier",
"deploy_eval_ap": 0.6458410401680073,
"top5_eval_ap": 0.655507218656965,
"oracle_eval_ap": 0.6665470019333972
},
{
"split": 4,
"policy": "SMAC",
"selector": "proxy_auc",
"deploy_eval_ap": 0.655507218656965,
"top5_eval_ap": 0.655507218656965,
"oracle_eval_ap": 0.6665470019333972
},
{
"split": 4,
"policy": "LLM",
"selector": "train_val_ap",
"deploy_eval_ap": 0.5580722760115239,
"top5_eval_ap": 0.5769510779737405,
"oracle_eval_ap": 0.5996924034497422
},
{
"split": 4,
"policy": "LLM",
"selector": "proxy_ap",
"deploy_eval_ap": 0.5929810545795948,
"top5_eval_ap": 0.5996924034497422,
"oracle_eval_ap": 0.5996924034497422
},
{
"split": 4,
"policy": "LLM",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.5381143061930622,
"top5_eval_ap": 0.5996924034497422,
"oracle_eval_ap": 0.5996924034497422
},
{
"split": 4,
"policy": "LLM",
"selector": "proxy_brier",
"deploy_eval_ap": 0.5996924034497422,
"top5_eval_ap": 0.5996924034497422,
"oracle_eval_ap": 0.5996924034497422
},
{
"split": 4,
"policy": "LLM",
"selector": "proxy_auc",
"deploy_eval_ap": 0.5929810545795948,
"top5_eval_ap": 0.5996924034497422,
"oracle_eval_ap": 0.5996924034497422
},
{
"split": 5,
"policy": "SMAC",
"selector": "train_val_ap",
"deploy_eval_ap": 0.4766814331572886,
"top5_eval_ap": 0.5455312939524202,
"oracle_eval_ap": 0.7144895023760132
},
{
"split": 5,
"policy": "SMAC",
"selector": "proxy_ap",
"deploy_eval_ap": 0.6996238632035302,
"top5_eval_ap": 0.6996238632035302,
"oracle_eval_ap": 0.7144895023760132
},
{
"split": 5,
"policy": "SMAC",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.674811244678726,
"top5_eval_ap": 0.6889647183194441,
"oracle_eval_ap": 0.7144895023760132
},
{
"split": 5,
"policy": "SMAC",
"selector": "proxy_brier",
"deploy_eval_ap": 0.674811244678726,
"top5_eval_ap": 0.6794965240318673,
"oracle_eval_ap": 0.7144895023760132
},
{
"split": 5,
"policy": "SMAC",
"selector": "proxy_auc",
"deploy_eval_ap": 0.6893304832924366,
"top5_eval_ap": 0.707395115377764,
"oracle_eval_ap": 0.7144895023760132
},
{
"split": 5,
"policy": "LLM",
"selector": "train_val_ap",
"deploy_eval_ap": 0.5699660365691224,
"top5_eval_ap": 0.580786807367587,
"oracle_eval_ap": 0.6170531937027124
},
{
"split": 5,
"policy": "LLM",
"selector": "proxy_ap",
"deploy_eval_ap": 0.6110326280684486,
"top5_eval_ap": 0.6170531937027124,
"oracle_eval_ap": 0.6170531937027124
},
{
"split": 5,
"policy": "LLM",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.5636349935114392,
"top5_eval_ap": 0.6110326280684486,
"oracle_eval_ap": 0.6170531937027124
},
{
"split": 5,
"policy": "LLM",
"selector": "proxy_brier",
"deploy_eval_ap": 0.5636349935114392,
"top5_eval_ap": 0.6110326280684486,
"oracle_eval_ap": 0.6170531937027124
},
{
"split": 5,
"policy": "LLM",
"selector": "proxy_auc",
"deploy_eval_ap": 0.6170531937027124,
"top5_eval_ap": 0.6170531937027124,
"oracle_eval_ap": 0.6170531937027124
},
{
"split": 6,
"policy": "SMAC",
"selector": "train_val_ap",
"deploy_eval_ap": 0.46762743937652196,
"top5_eval_ap": 0.5497164805265882,
"oracle_eval_ap": 0.6613877313531714
},
{
"split": 6,
"policy": "SMAC",
"selector": "proxy_ap",
"deploy_eval_ap": 0.6363687839062333,
"top5_eval_ap": 0.6495101818993542,
"oracle_eval_ap": 0.6613877313531714
},
{
"split": 6,
"policy": "SMAC",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.6302792233786925,
"top5_eval_ap": 0.6449900714167096,
"oracle_eval_ap": 0.6613877313531714
},
{
"split": 6,
"policy": "SMAC",
"selector": "proxy_brier",
"deploy_eval_ap": 0.6218583151992617,
"top5_eval_ap": 0.6613877313531714,
"oracle_eval_ap": 0.6613877313531714
},
{
"split": 6,
"policy": "SMAC",
"selector": "proxy_auc",
"deploy_eval_ap": 0.6547087651871317,
"top5_eval_ap": 0.6547087651871317,
"oracle_eval_ap": 0.6613877313531714
},
{
"split": 6,
"policy": "LLM",
"selector": "train_val_ap",
"deploy_eval_ap": 0.5228096505652988,
"top5_eval_ap": 0.5472450405857392,
"oracle_eval_ap": 0.5820159930148319
},
{
"split": 6,
"policy": "LLM",
"selector": "proxy_ap",
"deploy_eval_ap": 0.5749494698388545,
"top5_eval_ap": 0.5820159930148319,
"oracle_eval_ap": 0.5820159930148319
},
{
"split": 6,
"policy": "LLM",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.5197841478683497,
"top5_eval_ap": 0.5820159930148319,
"oracle_eval_ap": 0.5820159930148319
},
{
"split": 6,
"policy": "LLM",
"selector": "proxy_brier",
"deploy_eval_ap": 0.5820159930148319,
"top5_eval_ap": 0.5820159930148319,
"oracle_eval_ap": 0.5820159930148319
},
{
"split": 6,
"policy": "LLM",
"selector": "proxy_auc",
"deploy_eval_ap": 0.5749494698388545,
"top5_eval_ap": 0.5749494698388545,
"oracle_eval_ap": 0.5820159930148319
},
{
"split": 7,
"policy": "SMAC",
"selector": "train_val_ap",
"deploy_eval_ap": 0.4655134540960533,
"top5_eval_ap": 0.522726926569494,
"oracle_eval_ap": 0.6861187649104927
},
{
"split": 7,
"policy": "SMAC",
"selector": "proxy_ap",
"deploy_eval_ap": 0.6644946516875663,
"top5_eval_ap": 0.6722847504543532,
"oracle_eval_ap": 0.6861187649104927
},
{
"split": 7,
"policy": "SMAC",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.6374107287330919,
"top5_eval_ap": 0.6575185205692705,
"oracle_eval_ap": 0.6861187649104927
},
{
"split": 7,
"policy": "SMAC",
"selector": "proxy_brier",
"deploy_eval_ap": 0.6374107287330919,
"top5_eval_ap": 0.6575185205692705,
"oracle_eval_ap": 0.6861187649104927
},
{
"split": 7,
"policy": "SMAC",
"selector": "proxy_auc",
"deploy_eval_ap": 0.6744851082264265,
"top5_eval_ap": 0.6744851082264265,
"oracle_eval_ap": 0.6861187649104927
},
{
"split": 7,
"policy": "LLM",
"selector": "train_val_ap",
"deploy_eval_ap": 0.5492889416845734,
"top5_eval_ap": 0.5597422907504639,
"oracle_eval_ap": 0.5881312754667634
},
{
"split": 7,
"policy": "LLM",
"selector": "proxy_ap",
"deploy_eval_ap": 0.5825149439259846,
"top5_eval_ap": 0.5881312754667634,
"oracle_eval_ap": 0.5881312754667634
},
{
"split": 7,
"policy": "LLM",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.5406230156355737,
"top5_eval_ap": 0.5825149439259846,
"oracle_eval_ap": 0.5881312754667634
},
{
"split": 7,
"policy": "LLM",
"selector": "proxy_brier",
"deploy_eval_ap": 0.5406230156355737,
"top5_eval_ap": 0.5825149439259846,
"oracle_eval_ap": 0.5881312754667634
},
{
"split": 7,
"policy": "LLM",
"selector": "proxy_auc",
"deploy_eval_ap": 0.5881312754667634,
"top5_eval_ap": 0.5881312754667634,
"oracle_eval_ap": 0.5881312754667634
},
{
"split": 8,
"policy": "SMAC",
"selector": "train_val_ap",
"deploy_eval_ap": 0.4671888729291876,
"top5_eval_ap": 0.5527941540405327,
"oracle_eval_ap": 0.6909129736754938
},
{
"split": 8,
"policy": "SMAC",
"selector": "proxy_ap",
"deploy_eval_ap": 0.6681493403214834,
"top5_eval_ap": 0.6858005151499248,
"oracle_eval_ap": 0.6909129736754938
},
{
"split": 8,
"policy": "SMAC",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.6613137040400633,
"top5_eval_ap": 0.675795982690935,
"oracle_eval_ap": 0.6909129736754938
},
{
"split": 8,
"policy": "SMAC",
"selector": "proxy_brier",
"deploy_eval_ap": 0.6613137040400633,
"top5_eval_ap": 0.675795982690935,
"oracle_eval_ap": 0.6909129736754938
},
{
"split": 8,
"policy": "SMAC",
"selector": "proxy_auc",
"deploy_eval_ap": 0.6681493403214834,
"top5_eval_ap": 0.675795982690935,
"oracle_eval_ap": 0.6909129736754938
},
{
"split": 8,
"policy": "LLM",
"selector": "train_val_ap",
"deploy_eval_ap": 0.5693244864895343,
"top5_eval_ap": 0.5780891113869431,
"oracle_eval_ap": 0.6174737647198649
},
{
"split": 8,
"policy": "LLM",
"selector": "proxy_ap",
"deploy_eval_ap": 0.6096789446505377,
"top5_eval_ap": 0.6174737647198649,
"oracle_eval_ap": 0.6174737647198649
},
{
"split": 8,
"policy": "LLM",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.5475975540445444,
"top5_eval_ap": 0.6096789446505377,
"oracle_eval_ap": 0.6174737647198649
},
{
"split": 8,
"policy": "LLM",
"selector": "proxy_brier",
"deploy_eval_ap": 0.5475975540445444,
"top5_eval_ap": 0.6096789446505377,
"oracle_eval_ap": 0.6174737647198649
},
{
"split": 8,
"policy": "LLM",
"selector": "proxy_auc",
"deploy_eval_ap": 0.6174737647198649,
"top5_eval_ap": 0.6174737647198649,
"oracle_eval_ap": 0.6174737647198649
},
{
"split": 9,
"policy": "SMAC",
"selector": "train_val_ap",
"deploy_eval_ap": 0.4647268261279126,
"top5_eval_ap": 0.5352504052738676,
"oracle_eval_ap": 0.6595143352252696
},
{
"split": 9,
"policy": "SMAC",
"selector": "proxy_ap",
"deploy_eval_ap": 0.6352649178425169,
"top5_eval_ap": 0.6469598871324141,
"oracle_eval_ap": 0.6595143352252696
},
{
"split": 9,
"policy": "SMAC",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.6383312189984667,
"top5_eval_ap": 0.6412995301486579,
"oracle_eval_ap": 0.6595143352252696
},
{
"split": 9,
"policy": "SMAC",
"selector": "proxy_brier",
"deploy_eval_ap": 0.6383312189984667,
"top5_eval_ap": 0.6412995301486579,
"oracle_eval_ap": 0.6595143352252696
},
{
"split": 9,
"policy": "SMAC",
"selector": "proxy_auc",
"deploy_eval_ap": 0.6412995301486579,
"top5_eval_ap": 0.6412995301486579,
"oracle_eval_ap": 0.6595143352252696
},
{
"split": 9,
"policy": "LLM",
"selector": "train_val_ap",
"deploy_eval_ap": 0.5591218602390743,
"top5_eval_ap": 0.5723850410583204,
"oracle_eval_ap": 0.6060849802997287
},
{
"split": 9,
"policy": "LLM",
"selector": "proxy_ap",
"deploy_eval_ap": 0.6026304288042699,
"top5_eval_ap": 0.6060849802997287,
"oracle_eval_ap": 0.6060849802997287
},
{
"split": 9,
"policy": "LLM",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.5630703886645162,
"top5_eval_ap": 0.6060849802997287,
"oracle_eval_ap": 0.6060849802997287
},
{
"split": 9,
"policy": "LLM",
"selector": "proxy_brier",
"deploy_eval_ap": 0.5630703886645162,
"top5_eval_ap": 0.6060849802997287,
"oracle_eval_ap": 0.6060849802997287
},
{
"split": 9,
"policy": "LLM",
"selector": "proxy_auc",
"deploy_eval_ap": 0.6026304288042699,
"top5_eval_ap": 0.6060849802997287,
"oracle_eval_ap": 0.6060849802997287
},
{
"split": 10,
"policy": "SMAC",
"selector": "train_val_ap",
"deploy_eval_ap": 0.43252556578138707,
"top5_eval_ap": 0.545737859838442,
"oracle_eval_ap": 0.6510920526336375
},
{
"split": 10,
"policy": "SMAC",
"selector": "proxy_ap",
"deploy_eval_ap": 0.6328251297478321,
"top5_eval_ap": 0.6328251297478321,
"oracle_eval_ap": 0.6510920526336375
},
{
"split": 10,
"policy": "SMAC",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.6269563345523465,
"top5_eval_ap": 0.6298090860067376,
"oracle_eval_ap": 0.6510920526336375
},
{
"split": 10,
"policy": "SMAC",
"selector": "proxy_brier",
"deploy_eval_ap": 0.6269563345523465,
"top5_eval_ap": 0.6298090860067376,
"oracle_eval_ap": 0.6510920526336375
},
{
"split": 10,
"policy": "SMAC",
"selector": "proxy_auc",
"deploy_eval_ap": 0.6298090860067376,
"top5_eval_ap": 0.6298090860067376,
"oracle_eval_ap": 0.6510920526336375
},
{
"split": 10,
"policy": "LLM",
"selector": "train_val_ap",
"deploy_eval_ap": 0.5107000309646199,
"top5_eval_ap": 0.5299460337513402,
"oracle_eval_ap": 0.5705619158989852
},
{
"split": 10,
"policy": "LLM",
"selector": "proxy_ap",
"deploy_eval_ap": 0.5396149215794253,
"top5_eval_ap": 0.5705619158989852,
"oracle_eval_ap": 0.5705619158989852
},
{
"split": 10,
"policy": "LLM",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.5177459209938902,
"top5_eval_ap": 0.5680304207869833,
"oracle_eval_ap": 0.5705619158989852
},
{
"split": 10,
"policy": "LLM",
"selector": "proxy_brier",
"deploy_eval_ap": 0.5680304207869833,
"top5_eval_ap": 0.5680304207869833,
"oracle_eval_ap": 0.5705619158989852
},
{
"split": 10,
"policy": "LLM",
"selector": "proxy_auc",
"deploy_eval_ap": 0.5489515867423438,
"top5_eval_ap": 0.5705619158989852,
"oracle_eval_ap": 0.5705619158989852
},
{
"split": 11,
"policy": "SMAC",
"selector": "train_val_ap",
"deploy_eval_ap": 0.4710269964771887,
"top5_eval_ap": 0.5467773233971552,
"oracle_eval_ap": 0.6719548100783407
},
{
"split": 11,
"policy": "SMAC",
"selector": "proxy_ap",
"deploy_eval_ap": 0.6594384456486362,
"top5_eval_ap": 0.6667222629479316,
"oracle_eval_ap": 0.6719548100783407
},
{
"split": 11,
"policy": "SMAC",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.6425104798363381,
"top5_eval_ap": 0.6594384456486362,
"oracle_eval_ap": 0.6719548100783407
},
{
"split": 11,
"policy": "SMAC",
"selector": "proxy_brier",
"deploy_eval_ap": 0.6425104798363381,
"top5_eval_ap": 0.6594384456486362,
"oracle_eval_ap": 0.6719548100783407
},
{
"split": 11,
"policy": "SMAC",
"selector": "proxy_auc",
"deploy_eval_ap": 0.6616147383178763,
"top5_eval_ap": 0.6667222629479316,
"oracle_eval_ap": 0.6719548100783407
},
{
"split": 11,
"policy": "LLM",
"selector": "train_val_ap",
"deploy_eval_ap": 0.5364096772470438,
"top5_eval_ap": 0.5543741202179301,
"oracle_eval_ap": 0.5968778721083486
},
{
"split": 11,
"policy": "LLM",
"selector": "proxy_ap",
"deploy_eval_ap": 0.5968778721083486,
"top5_eval_ap": 0.5968778721083486,
"oracle_eval_ap": 0.5968778721083486
},
{
"split": 11,
"policy": "LLM",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.5330398750639705,
"top5_eval_ap": 0.5960184148586979,
"oracle_eval_ap": 0.5968778721083486
},
{
"split": 11,
"policy": "LLM",
"selector": "proxy_brier",
"deploy_eval_ap": 0.5960184148586979,
"top5_eval_ap": 0.5960184148586979,
"oracle_eval_ap": 0.5968778721083486
},
{
"split": 11,
"policy": "LLM",
"selector": "proxy_auc",
"deploy_eval_ap": 0.5687816448742656,
"top5_eval_ap": 0.5968778721083486,
"oracle_eval_ap": 0.5968778721083486
},
{
"split": 12,
"policy": "SMAC",
"selector": "train_val_ap",
"deploy_eval_ap": 0.48477110005647617,
"top5_eval_ap": 0.5662010238381728,
"oracle_eval_ap": 0.6709011946518153
},
{
"split": 12,
"policy": "SMAC",
"selector": "proxy_ap",
"deploy_eval_ap": 0.6683911800553934,
"top5_eval_ap": 0.6683911800553934,
"oracle_eval_ap": 0.6709011946518153
},
{
"split": 12,
"policy": "SMAC",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.6537367742804812,
"top5_eval_ap": 0.655984953380698,
"oracle_eval_ap": 0.6709011946518153
},
{
"split": 12,
"policy": "SMAC",
"selector": "proxy_brier",
"deploy_eval_ap": 0.6537367742804812,
"top5_eval_ap": 0.655984953380698,
"oracle_eval_ap": 0.6709011946518153
},
{
"split": 12,
"policy": "SMAC",
"selector": "proxy_auc",
"deploy_eval_ap": 0.6558046451703515,
"top5_eval_ap": 0.6571243796655735,
"oracle_eval_ap": 0.6709011946518153
},
{
"split": 12,
"policy": "LLM",
"selector": "train_val_ap",
"deploy_eval_ap": 0.5571257414916191,
"top5_eval_ap": 0.5724004287234477,
"oracle_eval_ap": 0.6101282070029501
},
{
"split": 12,
"policy": "LLM",
"selector": "proxy_ap",
"deploy_eval_ap": 0.5923391898216597,
"top5_eval_ap": 0.6101282070029501,
"oracle_eval_ap": 0.6101282070029501
},
{
"split": 12,
"policy": "LLM",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.5534026034732688,
"top5_eval_ap": 0.6101282070029501,
"oracle_eval_ap": 0.6101282070029501
},
{
"split": 12,
"policy": "LLM",
"selector": "proxy_brier",
"deploy_eval_ap": 0.5534026034732688,
"top5_eval_ap": 0.6101282070029501,
"oracle_eval_ap": 0.6101282070029501
},
{
"split": 12,
"policy": "LLM",
"selector": "proxy_auc",
"deploy_eval_ap": 0.5923391898216597,
"top5_eval_ap": 0.5923391898216597,
"oracle_eval_ap": 0.6101282070029501
},
{
"split": 13,
"policy": "SMAC",
"selector": "train_val_ap",
"deploy_eval_ap": 0.46424878925358426,
"top5_eval_ap": 0.5526461047395709,
"oracle_eval_ap": 0.6596211026179731
},
{
"split": 13,
"policy": "SMAC",
"selector": "proxy_ap",
"deploy_eval_ap": 0.6423379220862562,
"top5_eval_ap": 0.6531102460331455,
"oracle_eval_ap": 0.6596211026179731
},
{
"split": 13,
"policy": "SMAC",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.6400759109195303,
"top5_eval_ap": 0.648796848874525,
"oracle_eval_ap": 0.6596211026179731
},
{
"split": 13,
"policy": "SMAC",
"selector": "proxy_brier",
"deploy_eval_ap": 0.6382008066612993,
"top5_eval_ap": 0.648796848874525,
"oracle_eval_ap": 0.6596211026179731
},
{
"split": 13,
"policy": "SMAC",
"selector": "proxy_auc",
"deploy_eval_ap": 0.6433876237385332,
"top5_eval_ap": 0.6596211026179731,
"oracle_eval_ap": 0.6596211026179731
},
{
"split": 13,
"policy": "LLM",
"selector": "train_val_ap",
"deploy_eval_ap": 0.5542102452808897,
"top5_eval_ap": 0.5713349471167026,
"oracle_eval_ap": 0.6101575436136442
},
{
"split": 13,
"policy": "LLM",
"selector": "proxy_ap",
"deploy_eval_ap": 0.597567237938185,
"top5_eval_ap": 0.6101575436136442,
"oracle_eval_ap": 0.6101575436136442
},
{
"split": 13,
"policy": "LLM",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.5560502121944897,
"top5_eval_ap": 0.6101575436136442,
"oracle_eval_ap": 0.6101575436136442
},
{
"split": 13,
"policy": "LLM",
"selector": "proxy_brier",
"deploy_eval_ap": 0.5560502121944897,
"top5_eval_ap": 0.6101575436136442,
"oracle_eval_ap": 0.6101575436136442
},
{
"split": 13,
"policy": "LLM",
"selector": "proxy_auc",
"deploy_eval_ap": 0.597567237938185,
"top5_eval_ap": 0.597567237938185,
"oracle_eval_ap": 0.6101575436136442
},
{
"split": 14,
"policy": "SMAC",
"selector": "train_val_ap",
"deploy_eval_ap": 0.48573170965343504,
"top5_eval_ap": 0.5571016213991584,
"oracle_eval_ap": 0.706811019289939
},
{
"split": 14,
"policy": "SMAC",
"selector": "proxy_ap",
"deploy_eval_ap": 0.677433995089546,
"top5_eval_ap": 0.6986598664783432,
"oracle_eval_ap": 0.706811019289939
},
{
"split": 14,
"policy": "SMAC",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.6743009496363566,
"top5_eval_ap": 0.6970399756161322,
"oracle_eval_ap": 0.706811019289939
},
{
"split": 14,
"policy": "SMAC",
"selector": "proxy_brier",
"deploy_eval_ap": 0.6743009496363566,
"top5_eval_ap": 0.6970399756161322,
"oracle_eval_ap": 0.706811019289939
},
{
"split": 14,
"policy": "SMAC",
"selector": "proxy_auc",
"deploy_eval_ap": 0.706811019289939,
"top5_eval_ap": 0.706811019289939,
"oracle_eval_ap": 0.706811019289939
},
{
"split": 14,
"policy": "LLM",
"selector": "train_val_ap",
"deploy_eval_ap": 0.5576376597054382,
"top5_eval_ap": 0.5669921922681518,
"oracle_eval_ap": 0.6436329100802731
},
{
"split": 14,
"policy": "LLM",
"selector": "proxy_ap",
"deploy_eval_ap": 0.6115519107659961,
"top5_eval_ap": 0.6115519107659961,
"oracle_eval_ap": 0.6436329100802731
},
{
"split": 14,
"policy": "LLM",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.5543941938024801,
"top5_eval_ap": 0.6115519107659961,
"oracle_eval_ap": 0.6436329100802731
},
{
"split": 14,
"policy": "LLM",
"selector": "proxy_brier",
"deploy_eval_ap": 0.5543941938024801,
"top5_eval_ap": 0.6115519107659961,
"oracle_eval_ap": 0.6436329100802731
},
{
"split": 14,
"policy": "LLM",
"selector": "proxy_auc",
"deploy_eval_ap": 0.5930515876054733,
"top5_eval_ap": 0.6436329100802731,
"oracle_eval_ap": 0.6436329100802731
},
{
"split": 15,
"policy": "SMAC",
"selector": "train_val_ap",
"deploy_eval_ap": 0.478137602574508,
"top5_eval_ap": 0.6035334495920432,
"oracle_eval_ap": 0.6907808119723886
},
{
"split": 15,
"policy": "SMAC",
"selector": "proxy_ap",
"deploy_eval_ap": 0.6585420344863675,
"top5_eval_ap": 0.6626179830682002,
"oracle_eval_ap": 0.6907808119723886
},
{
"split": 15,
"policy": "SMAC",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.6488358732455428,
"top5_eval_ap": 0.6585420344863675,
"oracle_eval_ap": 0.6907808119723886
},
{
"split": 15,
"policy": "SMAC",
"selector": "proxy_brier",
"deploy_eval_ap": 0.6488358732455428,
"top5_eval_ap": 0.6585420344863675,
"oracle_eval_ap": 0.6907808119723886
},
{
"split": 15,
"policy": "SMAC",
"selector": "proxy_auc",
"deploy_eval_ap": 0.6526664898991454,
"top5_eval_ap": 0.6626179830682002,
"oracle_eval_ap": 0.6907808119723886
},
{
"split": 15,
"policy": "LLM",
"selector": "train_val_ap",
"deploy_eval_ap": 0.5263984758406471,
"top5_eval_ap": 0.5405265639280998,
"oracle_eval_ap": 0.5941351543506521
},
{
"split": 15,
"policy": "LLM",
"selector": "proxy_ap",
"deploy_eval_ap": 0.5757554508817501,
"top5_eval_ap": 0.5941351543506521,
"oracle_eval_ap": 0.5941351543506521
},
{
"split": 15,
"policy": "LLM",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.5757554508817501,
"top5_eval_ap": 0.5757554508817501,
"oracle_eval_ap": 0.5941351543506521
},
{
"split": 15,
"policy": "LLM",
"selector": "proxy_brier",
"deploy_eval_ap": 0.5757554508817501,
"top5_eval_ap": 0.5757554508817501,
"oracle_eval_ap": 0.5941351543506521
},
{
"split": 15,
"policy": "LLM",
"selector": "proxy_auc",
"deploy_eval_ap": 0.5609746889071622,
"top5_eval_ap": 0.5941351543506521,
"oracle_eval_ap": 0.5941351543506521
},
{
"split": 16,
"policy": "SMAC",
"selector": "train_val_ap",
"deploy_eval_ap": 0.48347433637766246,
"top5_eval_ap": 0.5542497960909861,
"oracle_eval_ap": 0.6792151940442446
},
{
"split": 16,
"policy": "SMAC",
"selector": "proxy_ap",
"deploy_eval_ap": 0.6704260223189045,
"top5_eval_ap": 0.6704260223189045,
"oracle_eval_ap": 0.6792151940442446
},
{
"split": 16,
"policy": "SMAC",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.6496261958623482,
"top5_eval_ap": 0.667923356262339,
"oracle_eval_ap": 0.6792151940442446
},
{
"split": 16,
"policy": "SMAC",
"selector": "proxy_brier",
"deploy_eval_ap": 0.6538902227589642,
"top5_eval_ap": 0.657860437409312,
"oracle_eval_ap": 0.6792151940442446
},
{
"split": 16,
"policy": "SMAC",
"selector": "proxy_auc",
"deploy_eval_ap": 0.6519335091567344,
"top5_eval_ap": 0.6792151940442446,
"oracle_eval_ap": 0.6792151940442446
},
{
"split": 16,
"policy": "LLM",
"selector": "train_val_ap",
"deploy_eval_ap": 0.5416059436051286,
"top5_eval_ap": 0.5600151915305791,
"oracle_eval_ap": 0.5932504427370535
},
{
"split": 16,
"policy": "LLM",
"selector": "proxy_ap",
"deploy_eval_ap": 0.5850524686308571,
"top5_eval_ap": 0.5932504427370535,
"oracle_eval_ap": 0.5932504427370535
},
{
"split": 16,
"policy": "LLM",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.5327389623147321,
"top5_eval_ap": 0.5932504427370535,
"oracle_eval_ap": 0.5932504427370535
},
{
"split": 16,
"policy": "LLM",
"selector": "proxy_brier",
"deploy_eval_ap": 0.5932504427370535,
"top5_eval_ap": 0.5932504427370535,
"oracle_eval_ap": 0.5932504427370535
},
{
"split": 16,
"policy": "LLM",
"selector": "proxy_auc",
"deploy_eval_ap": 0.5850524686308571,
"top5_eval_ap": 0.5850524686308571,
"oracle_eval_ap": 0.5932504427370535
},
{
"split": 17,
"policy": "SMAC",
"selector": "train_val_ap",
"deploy_eval_ap": 0.4649606317608773,
"top5_eval_ap": 0.5340079584689927,
"oracle_eval_ap": 0.6649893230620163
},
{
"split": 17,
"policy": "SMAC",
"selector": "proxy_ap",
"deploy_eval_ap": 0.6428038478697953,
"top5_eval_ap": 0.6539513241791239,
"oracle_eval_ap": 0.6649893230620163
},
{
"split": 17,
"policy": "SMAC",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.6428038478697953,
"top5_eval_ap": 0.6629995698938378,
"oracle_eval_ap": 0.6649893230620163
},
{
"split": 17,
"policy": "SMAC",
"selector": "proxy_brier",
"deploy_eval_ap": 0.6428038478697953,
"top5_eval_ap": 0.6456547506299378,
"oracle_eval_ap": 0.6649893230620163
},
{
"split": 17,
"policy": "SMAC",
"selector": "proxy_auc",
"deploy_eval_ap": 0.6456547506299378,
"top5_eval_ap": 0.6649893230620163,
"oracle_eval_ap": 0.6649893230620163
},
{
"split": 17,
"policy": "LLM",
"selector": "train_val_ap",
"deploy_eval_ap": 0.5348676749866335,
"top5_eval_ap": 0.5446056544806404,
"oracle_eval_ap": 0.579352918072389
},
{
"split": 17,
"policy": "LLM",
"selector": "proxy_ap",
"deploy_eval_ap": 0.5718675106734894,
"top5_eval_ap": 0.579352918072389,
"oracle_eval_ap": 0.579352918072389
},
{
"split": 17,
"policy": "LLM",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.5261790671930053,
"top5_eval_ap": 0.579352918072389,
"oracle_eval_ap": 0.579352918072389
},
{
"split": 17,
"policy": "LLM",
"selector": "proxy_brier",
"deploy_eval_ap": 0.5261790671930053,
"top5_eval_ap": 0.579352918072389,
"oracle_eval_ap": 0.579352918072389
},
{
"split": 17,
"policy": "LLM",
"selector": "proxy_auc",
"deploy_eval_ap": 0.5718675106734894,
"top5_eval_ap": 0.579352918072389,
"oracle_eval_ap": 0.579352918072389
},
{
"split": 18,
"policy": "SMAC",
"selector": "train_val_ap",
"deploy_eval_ap": 0.4531073060880456,
"top5_eval_ap": 0.5436616702921386,
"oracle_eval_ap": 0.6838512120663813
},
{
"split": 18,
"policy": "SMAC",
"selector": "proxy_ap",
"deploy_eval_ap": 0.6223927371229265,
"top5_eval_ap": 0.6648512526938274,
"oracle_eval_ap": 0.6838512120663813
},
{
"split": 18,
"policy": "SMAC",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.654015043616063,
"top5_eval_ap": 0.6638824217815192,
"oracle_eval_ap": 0.6838512120663813
},
{
"split": 18,
"policy": "SMAC",
"selector": "proxy_brier",
"deploy_eval_ap": 0.654015043616063,
"top5_eval_ap": 0.6638824217815192,
"oracle_eval_ap": 0.6838512120663813
},
{
"split": 18,
"policy": "SMAC",
"selector": "proxy_auc",
"deploy_eval_ap": 0.6648512526938274,
"top5_eval_ap": 0.6648512526938274,
"oracle_eval_ap": 0.6838512120663813
},
{
"split": 18,
"policy": "LLM",
"selector": "train_val_ap",
"deploy_eval_ap": 0.5120617315361997,
"top5_eval_ap": 0.5365263833358878,
"oracle_eval_ap": 0.578623298812676
},
{
"split": 18,
"policy": "LLM",
"selector": "proxy_ap",
"deploy_eval_ap": 0.5664905732884257,
"top5_eval_ap": 0.578623298812676,
"oracle_eval_ap": 0.578623298812676
},
{
"split": 18,
"policy": "LLM",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.5141500314699055,
"top5_eval_ap": 0.5664905732884257,
"oracle_eval_ap": 0.578623298812676
},
{
"split": 18,
"policy": "LLM",
"selector": "proxy_brier",
"deploy_eval_ap": 0.5664905732884257,
"top5_eval_ap": 0.5664905732884257,
"oracle_eval_ap": 0.578623298812676
},
{
"split": 18,
"policy": "LLM",
"selector": "proxy_auc",
"deploy_eval_ap": 0.5458621922252527,
"top5_eval_ap": 0.578623298812676,
"oracle_eval_ap": 0.578623298812676
},
{
"split": 19,
"policy": "SMAC",
"selector": "train_val_ap",
"deploy_eval_ap": 0.44407823183784984,
"top5_eval_ap": 0.5488701040645936,
"oracle_eval_ap": 0.6512634701693791
},
{
"split": 19,
"policy": "SMAC",
"selector": "proxy_ap",
"deploy_eval_ap": 0.6216870554572433,
"top5_eval_ap": 0.6460088873809331,
"oracle_eval_ap": 0.6512634701693791
},
{
"split": 19,
"policy": "SMAC",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.6216870554572433,
"top5_eval_ap": 0.6216870554572433,
"oracle_eval_ap": 0.6512634701693791
},
{
"split": 19,
"policy": "SMAC",
"selector": "proxy_brier",
"deploy_eval_ap": 0.6216870554572433,
"top5_eval_ap": 0.6216870554572433,
"oracle_eval_ap": 0.6512634701693791
},
{
"split": 19,
"policy": "SMAC",
"selector": "proxy_auc",
"deploy_eval_ap": 0.630631866544245,
"top5_eval_ap": 0.630631866544245,
"oracle_eval_ap": 0.6512634701693791
},
{
"split": 19,
"policy": "LLM",
"selector": "train_val_ap",
"deploy_eval_ap": 0.5381205484033079,
"top5_eval_ap": 0.5467457949477925,
"oracle_eval_ap": 0.5795121120881965
},
{
"split": 19,
"policy": "LLM",
"selector": "proxy_ap",
"deploy_eval_ap": 0.5690007856001769,
"top5_eval_ap": 0.5791181610505296,
"oracle_eval_ap": 0.5795121120881965
},
{
"split": 19,
"policy": "LLM",
"selector": "proxy_logloss",
"deploy_eval_ap": 0.5213055580115359,
"top5_eval_ap": 0.5791181610505296,
"oracle_eval_ap": 0.5795121120881965
},
{
"split": 19,
"policy": "LLM",
"selector": "proxy_brier",
"deploy_eval_ap": 0.5791181610505296,
"top5_eval_ap": 0.5791181610505296,
"oracle_eval_ap": 0.5795121120881965
},
{
"split": 19,
"policy": "LLM",
"selector": "proxy_auc",
"deploy_eval_ap": 0.5690007856001769,
"top5_eval_ap": 0.5795121120881965,
"oracle_eval_ap": 0.5795121120881965
}
]
}