lestienne's picture
Add files using upload-large-folder tool
a967d9c verified
dataset,method,size,median,q1,q3,model,metric
20newsgroups,dp_calibration,8,0.7546407428,0.7338990779,0.8047618328,qwen2.5-7b-instruct,nce
20newsgroups,dp_calibration,16,0.6722159507000001,0.6698211084,0.676830939,qwen2.5-7b-instruct,nce
20newsgroups,dp_calibration,32,0.6430096215000001,0.6403825980000001,0.6511214839,qwen2.5-7b-instruct,nce
20newsgroups,dp_calibration,64,0.6289220125,0.6265720757000001,0.631040542,qwen2.5-7b-instruct,nce
20newsgroups,dp_calibration,128,0.6252026168,0.6250932114000001,0.6260644498,qwen2.5-7b-instruct,nce
20newsgroups,dp_calibration,256,0.6223887724,0.6219824888000001,0.6224369080000001,qwen2.5-7b-instruct,nce
20newsgroups,lora_1.0_no_es,8,0.8970295165000001,0.7341650795,1.151784799,qwen2.5-7b-instruct,nce
20newsgroups,lora_1.0_no_es,16,0.6817639091000001,0.6191390612000001,0.7082344190000001,qwen2.5-7b-instruct,nce
20newsgroups,lora_1.0_no_es,32,0.6072178758,0.5693403086000001,0.6446132967,qwen2.5-7b-instruct,nce
20newsgroups,lora_1.0_no_es,64,0.5854698319,0.5660984866000001,0.5988642388000001,qwen2.5-7b-instruct,nce
20newsgroups,lora_1.0_no_es,128,0.5330789077,0.5211436033,0.5584462306,qwen2.5-7b-instruct,nce
20newsgroups,lora_1.0_no_es,256,0.4908759883,0.4805303146,0.49917692890000004,qwen2.5-7b-instruct,nce
20newsgroups,lora_1.0_no_es_plus_tempscaling,8,0.5164427857,0.48580939240000004,0.5887411611000001,qwen2.5-7b-instruct,nce
20newsgroups,lora_1.0_no_es_plus_tempscaling,16,0.4153097787,0.38701372110000004,0.4217693354,qwen2.5-7b-instruct,nce
20newsgroups,lora_1.0_no_es_plus_tempscaling,32,0.3630036551,0.3588801407,0.3909213694,qwen2.5-7b-instruct,nce
20newsgroups,lora_1.0_no_es_plus_tempscaling,64,0.33619529340000004,0.3264030094,0.3373104462,qwen2.5-7b-instruct,nce
20newsgroups,lora_1.0_no_es_plus_tempscaling,128,0.3052118871,0.3036555081,0.3188620709,qwen2.5-7b-instruct,nce
20newsgroups,lora_1.0_no_es_plus_tempscaling,256,0.28938370820000003,0.28011730100000004,0.2893998508,qwen2.5-7b-instruct,nce
20newsgroups,no_adaptation,all,1.8155222332,1.8155222332,1.8155222332,qwen2.5-7b-instruct,nce
agnews,dp_calibration,8,0.5475612991000001,0.4308557295,5.1540645921,qwen2.5-7b-instruct,nce
agnews,dp_calibration,16,0.37575523980000003,0.3688441327,0.38479402020000003,qwen2.5-7b-instruct,nce
agnews,dp_calibration,32,0.3670299271,0.3629354594,0.3737943235,qwen2.5-7b-instruct,nce
agnews,dp_calibration,64,0.3630893481,0.3583663905,0.3684686372,qwen2.5-7b-instruct,nce
agnews,dp_calibration,128,0.3627221125,0.35768373400000003,0.36485945680000004,qwen2.5-7b-instruct,nce
agnews,dp_calibration,256,0.3600900656,0.35956136320000004,0.3618558266,qwen2.5-7b-instruct,nce
agnews,lora_1.0_no_es,8,0.40337454240000004,0.34410008200000003,0.5663038899,qwen2.5-7b-instruct,nce
agnews,lora_1.0_no_es,16,0.34303835380000003,0.3264562448,0.3911400108,qwen2.5-7b-instruct,nce
agnews,lora_1.0_no_es,32,0.34805550550000003,0.316641974,0.3716637875,qwen2.5-7b-instruct,nce
agnews,lora_1.0_no_es,64,0.3412170198,0.3103063056,0.353266397,qwen2.5-7b-instruct,nce
agnews,lora_1.0_no_es,128,0.3363076933,0.3060084903,0.3891033151,qwen2.5-7b-instruct,nce
agnews,lora_1.0_no_es,256,0.3833806171,0.3306922719,0.401552931,qwen2.5-7b-instruct,nce
agnews,lora_1.0_no_es_plus_tempscaling,8,0.8813786401,0.5663038884,2.8252298438,qwen2.5-7b-instruct,nce
agnews,lora_1.0_no_es_plus_tempscaling,16,0.2819799886,0.2114647891,0.462346197,qwen2.5-7b-instruct,nce
agnews,lora_1.0_no_es_plus_tempscaling,32,0.2040407394,0.20073165340000002,0.2487480343,qwen2.5-7b-instruct,nce
agnews,lora_1.0_no_es_plus_tempscaling,64,0.1843573212,0.18135832470000002,0.2402056629,qwen2.5-7b-instruct,nce
agnews,lora_1.0_no_es_plus_tempscaling,128,0.17588487730000002,0.16595165750000002,0.1952771271,qwen2.5-7b-instruct,nce
agnews,lora_1.0_no_es_plus_tempscaling,256,0.188050041,0.1838374452,0.19289939490000002,qwen2.5-7b-instruct,nce
agnews,no_adaptation,all,0.7804874617,0.7804874617,0.7804874617,qwen2.5-7b-instruct,nce
banking77,dp_calibration,8,0.9211202591000001,0.8969540282,0.9395120003,qwen2.5-7b-instruct,nce
banking77,dp_calibration,16,0.6924126717,0.688702176,0.7090195071000001,qwen2.5-7b-instruct,nce
banking77,dp_calibration,32,0.6080293509,0.6079581783,0.6174987147000001,qwen2.5-7b-instruct,nce
banking77,dp_calibration,64,0.5890287940000001,0.5869081101,0.5931369313,qwen2.5-7b-instruct,nce
banking77,dp_calibration,128,0.5788118008,0.5781138724,0.5804153826,qwen2.5-7b-instruct,nce
banking77,dp_calibration,256,0.5755764225000001,0.5743326591,0.5759252448000001,qwen2.5-7b-instruct,nce
banking77,lora_1.0_no_es,8,1.1526437873,1.133858138,1.2172204806,qwen2.5-7b-instruct,nce
banking77,lora_1.0_no_es,16,0.8376142773,0.7663219509,0.8430287544,qwen2.5-7b-instruct,nce
banking77,lora_1.0_no_es,32,0.431833061,0.3741628232,0.4744700187,qwen2.5-7b-instruct,nce
banking77,lora_1.0_no_es,64,0.2535351964,0.23965029570000002,0.2878752392,qwen2.5-7b-instruct,nce
banking77,lora_1.0_no_es,128,0.17637132490000001,0.17418127560000002,0.1827132079,qwen2.5-7b-instruct,nce
banking77,lora_1.0_no_es,256,0.1211115843,0.1160269002,0.1230462097,qwen2.5-7b-instruct,nce
banking77,lora_1.0_no_es_plus_tempscaling,8,0.5126252566,0.5087172014,0.5245015501,qwen2.5-7b-instruct,nce
banking77,lora_1.0_no_es_plus_tempscaling,16,0.3915767188,0.3773378858,0.39312194910000003,qwen2.5-7b-instruct,nce
banking77,lora_1.0_no_es_plus_tempscaling,32,0.2328782623,0.2287237182,0.2601202822,qwen2.5-7b-instruct,nce
banking77,lora_1.0_no_es_plus_tempscaling,64,0.1575941059,0.1511521726,0.1708726612,qwen2.5-7b-instruct,nce
banking77,lora_1.0_no_es_plus_tempscaling,128,0.1178169721,0.114955286,0.1224794936,qwen2.5-7b-instruct,nce
banking77,lora_1.0_no_es_plus_tempscaling,256,0.0954789776,0.09129492930000001,0.102971168,qwen2.5-7b-instruct,nce
banking77,no_adaptation,all,3.620646571,3.620646571,3.620646571,qwen2.5-7b-instruct,nce
dbpedia,dp_calibration,8,0.46647904900000003,0.4279377552,0.6477938087,qwen2.5-7b-instruct,nce
dbpedia,dp_calibration,16,0.3602248906,0.3429357467,0.3650911278,qwen2.5-7b-instruct,nce
dbpedia,dp_calibration,32,0.3198808405,0.3171919789,0.330171682,qwen2.5-7b-instruct,nce
dbpedia,dp_calibration,64,0.3122986887,0.30796754600000004,0.31843719470000004,qwen2.5-7b-instruct,nce
dbpedia,dp_calibration,128,0.3084408404,0.30647454080000003,0.3092564628,qwen2.5-7b-instruct,nce
dbpedia,dp_calibration,256,0.3045130057,0.3039342585,0.3074739521,qwen2.5-7b-instruct,nce
dbpedia,lora_1.0_no_es,8,0.0854842301,0.0818078181,0.2378510445,qwen2.5-7b-instruct,nce
dbpedia,lora_1.0_no_es,16,0.0238913501,0.0213010504,0.0317130754,qwen2.5-7b-instruct,nce
dbpedia,lora_1.0_no_es,32,0.023330053,0.0200872536,0.024519788600000002,qwen2.5-7b-instruct,nce
dbpedia,lora_1.0_no_es,64,0.0214499126,0.020564621,0.0216131826,qwen2.5-7b-instruct,nce
dbpedia,lora_1.0_no_es,128,0.019610381,0.0194516826,0.020471926300000002,qwen2.5-7b-instruct,nce
dbpedia,lora_1.0_no_es,256,0.0179246996,0.0175173316,0.021343073,qwen2.5-7b-instruct,nce
dbpedia,lora_1.0_no_es_plus_tempscaling,8,0.2109767494,0.0852541982,0.2221354599,qwen2.5-7b-instruct,nce
dbpedia,lora_1.0_no_es_plus_tempscaling,16,0.024701358200000002,0.023515019300000002,0.0390211745,qwen2.5-7b-instruct,nce
dbpedia,lora_1.0_no_es_plus_tempscaling,32,0.0218893949,0.0202724877,0.026834610000000002,qwen2.5-7b-instruct,nce
dbpedia,lora_1.0_no_es_plus_tempscaling,64,0.019806288000000002,0.018394005,0.0215219346,qwen2.5-7b-instruct,nce
dbpedia,lora_1.0_no_es_plus_tempscaling,128,0.020346316,0.0169711643,0.0213982321,qwen2.5-7b-instruct,nce
dbpedia,lora_1.0_no_es_plus_tempscaling,256,0.0146847382,0.013788605800000001,0.0172333126,qwen2.5-7b-instruct,nce
dbpedia,no_adaptation,all,2.2169198971,2.2169198971,2.2169198971,qwen2.5-7b-instruct,nce
sst2,dp_calibration,8,1.8578453731,0.5484148972,4.8035984745,qwen2.5-7b-instruct,nce
sst2,dp_calibration,16,0.4260125913,0.3331163405,3.4678246476,qwen2.5-7b-instruct,nce
sst2,dp_calibration,32,0.2101863343,0.2030086717,0.3538704279,qwen2.5-7b-instruct,nce
sst2,dp_calibration,64,0.2078482898,0.19890802970000002,0.2165603952,qwen2.5-7b-instruct,nce
sst2,dp_calibration,128,0.2023109472,0.2003097221,0.2062338649,qwen2.5-7b-instruct,nce
sst2,dp_calibration,256,0.2002892665,0.1989528511,0.2026887877,qwen2.5-7b-instruct,nce
sst2,lora_1.0_no_es,8,0.4607187232,0.4314848901,0.4856382273,qwen2.5-7b-instruct,nce
sst2,lora_1.0_no_es,16,0.44977507790000004,0.430824868,0.500663349,qwen2.5-7b-instruct,nce
sst2,lora_1.0_no_es,32,0.4223034915,0.39183229140000003,0.46554550570000003,qwen2.5-7b-instruct,nce
sst2,lora_1.0_no_es,64,0.43966463450000004,0.4099907151,0.483182404,qwen2.5-7b-instruct,nce
sst2,lora_1.0_no_es,128,0.4183330803,0.40817209930000004,0.4438870741,qwen2.5-7b-instruct,nce
sst2,lora_1.0_no_es,256,0.3979363261,0.3900455955,0.4254455446,qwen2.5-7b-instruct,nce
sst2,lora_1.0_no_es_plus_tempscaling,8,0.4762375547,0.4314848864,0.8747436196,qwen2.5-7b-instruct,nce
sst2,lora_1.0_no_es_plus_tempscaling,16,0.5261615692,0.4364734195,0.6054662234,qwen2.5-7b-instruct,nce
sst2,lora_1.0_no_es_plus_tempscaling,32,0.22529525600000003,0.21803730300000002,0.2436826967,qwen2.5-7b-instruct,nce
sst2,lora_1.0_no_es_plus_tempscaling,64,0.22126755620000002,0.2104355703,0.2409370089,qwen2.5-7b-instruct,nce
sst2,lora_1.0_no_es_plus_tempscaling,128,0.2123658578,0.2001110109,0.2189024068,qwen2.5-7b-instruct,nce
sst2,lora_1.0_no_es_plus_tempscaling,256,0.2011984275,0.1962976648,0.21163444920000002,qwen2.5-7b-instruct,nce
sst2,no_adaptation,all,0.3163844718,0.3163844718,0.3163844718,qwen2.5-7b-instruct,nce