File size: 9,525 Bytes
a967d9c
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
dataset,method,size,median,q1,q3,model,metric
20newsgroups,dp_calibration,8,0.6515353805,0.6368491322000001,0.6542056075,qwen2.5-7b-instruct,ner
20newsgroups,dp_calibration,16,0.5861148198,0.5647530040000001,0.6021361816,qwen2.5-7b-instruct,ner
20newsgroups,dp_calibration,32,0.5540720961,0.5367156208,0.5767690254,qwen2.5-7b-instruct,ner
20newsgroups,dp_calibration,64,0.5393858478,0.5380507343,0.5660881175,qwen2.5-7b-instruct,ner
20newsgroups,dp_calibration,128,0.5473965287,0.5420560748000001,0.5527369826,qwen2.5-7b-instruct,ner
20newsgroups,dp_calibration,256,0.5420560748000001,0.5420560748000001,0.5460614152000001,qwen2.5-7b-instruct,ner
20newsgroups,lora_1.0_no_es,8,0.4419225634,0.3925233645,0.4686248331,qwen2.5-7b-instruct,ner
20newsgroups,lora_1.0_no_es,16,0.39652870490000003,0.3751668892,0.3978638184,qwen2.5-7b-instruct,ner
20newsgroups,lora_1.0_no_es,32,0.3391188251,0.3230974633,0.3484646195,qwen2.5-7b-instruct,ner
20newsgroups,lora_1.0_no_es,64,0.3097463284,0.308411215,0.31108144190000003,qwen2.5-7b-instruct,ner
20newsgroups,lora_1.0_no_es,128,0.2883845127,0.28437917220000003,0.2897196262,qwen2.5-7b-instruct,ner
20newsgroups,lora_1.0_no_es,256,0.2723631509,0.2550066756,0.2763684913,qwen2.5-7b-instruct,ner
20newsgroups,lora_1.0_no_es_plus_tempscaling,8,0.4419225634,0.3925233645,0.4686248331,qwen2.5-7b-instruct,ner
20newsgroups,lora_1.0_no_es_plus_tempscaling,16,0.39652870490000003,0.3751668892,0.3978638184,qwen2.5-7b-instruct,ner
20newsgroups,lora_1.0_no_es_plus_tempscaling,32,0.3391188251,0.3230974633,0.3484646195,qwen2.5-7b-instruct,ner
20newsgroups,lora_1.0_no_es_plus_tempscaling,64,0.3097463284,0.308411215,0.31108144190000003,qwen2.5-7b-instruct,ner
20newsgroups,lora_1.0_no_es_plus_tempscaling,128,0.2883845127,0.28437917220000003,0.2897196262,qwen2.5-7b-instruct,ner
20newsgroups,lora_1.0_no_es_plus_tempscaling,256,0.2723631509,0.2550066756,0.2763684913,qwen2.5-7b-instruct,ner
20newsgroups,no_adaptation,all,0.7983978638,0.7983978638,0.7983978638,qwen2.5-7b-instruct,ner
agnews,dp_calibration,8,0.2440677966,0.2305084746,0.2881355932,qwen2.5-7b-instruct,ner
agnews,dp_calibration,16,0.2305084746,0.21694915250000002,0.2440677966,qwen2.5-7b-instruct,ner
agnews,dp_calibration,32,0.2305084746,0.21355932200000002,0.2406779661,qwen2.5-7b-instruct,ner
agnews,dp_calibration,64,0.2305084746,0.2305084746,0.2338983051,qwen2.5-7b-instruct,ner
agnews,dp_calibration,128,0.2203389831,0.21694915250000002,0.2305084746,qwen2.5-7b-instruct,ner
agnews,dp_calibration,256,0.21355932200000002,0.21355932200000002,0.22711864410000002,qwen2.5-7b-instruct,ner
agnews,lora_1.0_no_es,8,0.19322033900000002,0.1355932203,0.22372881360000002,qwen2.5-7b-instruct,ner
agnews,lora_1.0_no_es,16,0.1457627119,0.1288135593,0.1694915254,qwen2.5-7b-instruct,ner
agnews,lora_1.0_no_es,32,0.1288135593,0.11186440680000001,0.1355932203,qwen2.5-7b-instruct,ner
agnews,lora_1.0_no_es,64,0.1186440678,0.1050847458,0.1220338983,qwen2.5-7b-instruct,ner
agnews,lora_1.0_no_es,128,0.11186440680000001,0.1050847458,0.11186440680000001,qwen2.5-7b-instruct,ner
agnews,lora_1.0_no_es,256,0.10169491530000001,0.0915254237,0.1152542373,qwen2.5-7b-instruct,ner
agnews,lora_1.0_no_es_plus_tempscaling,8,0.19322033900000002,0.1355932203,0.22372881360000002,qwen2.5-7b-instruct,ner
agnews,lora_1.0_no_es_plus_tempscaling,16,0.1457627119,0.1288135593,0.1694915254,qwen2.5-7b-instruct,ner
agnews,lora_1.0_no_es_plus_tempscaling,32,0.1288135593,0.11186440680000001,0.1355932203,qwen2.5-7b-instruct,ner
agnews,lora_1.0_no_es_plus_tempscaling,64,0.1186440678,0.1050847458,0.1220338983,qwen2.5-7b-instruct,ner
agnews,lora_1.0_no_es_plus_tempscaling,128,0.11186440680000001,0.1050847458,0.11186440680000001,qwen2.5-7b-instruct,ner
agnews,lora_1.0_no_es_plus_tempscaling,256,0.10169491530000001,0.0915254237,0.1152542373,qwen2.5-7b-instruct,ner
agnews,no_adaptation,all,0.2745762712,0.2745762712,0.2745762712,qwen2.5-7b-instruct,ner
banking77,dp_calibration,8,0.7109295199,0.6884576098,0.7109295199,qwen2.5-7b-instruct,ner
banking77,dp_calibration,16,0.6486210419,0.6373850868000001,0.6506639428000001,qwen2.5-7b-instruct,ner
banking77,dp_calibration,32,0.6016343207,0.5965270684,0.6138917263,qwen2.5-7b-instruct,ner
banking77,dp_calibration,64,0.582226762,0.5791624106000001,0.5832482125,qwen2.5-7b-instruct,ner
banking77,dp_calibration,128,0.5699693565,0.568947906,0.5720122574000001,qwen2.5-7b-instruct,ner
banking77,dp_calibration,256,0.5617977528,0.5607763023,0.5638406537,qwen2.5-7b-instruct,ner
banking77,lora_1.0_no_es,8,0.5076608784000001,0.4994892748,0.5362614913,qwen2.5-7b-instruct,ner
banking77,lora_1.0_no_es,16,0.3830439224,0.37793667010000004,0.40347293160000003,qwen2.5-7b-instruct,ner
banking77,lora_1.0_no_es,32,0.26353421860000004,0.26353421860000004,0.2717058223,qwen2.5-7b-instruct,ner
banking77,lora_1.0_no_es,64,0.19407558730000002,0.1818181818,0.19713993870000002,qwen2.5-7b-instruct,ner
banking77,lora_1.0_no_es,128,0.1440245148,0.1409601634,0.1440245148,qwen2.5-7b-instruct,ner
banking77,lora_1.0_no_es,256,0.1113381001,0.1082737487,0.1297242084,qwen2.5-7b-instruct,ner
banking77,lora_1.0_no_es_plus_tempscaling,8,0.5076608784000001,0.4994892748,0.5362614913,qwen2.5-7b-instruct,ner
banking77,lora_1.0_no_es_plus_tempscaling,16,0.3830439224,0.37793667010000004,0.40347293160000003,qwen2.5-7b-instruct,ner
banking77,lora_1.0_no_es_plus_tempscaling,32,0.26353421860000004,0.26353421860000004,0.2717058223,qwen2.5-7b-instruct,ner
banking77,lora_1.0_no_es_plus_tempscaling,64,0.19407558730000002,0.1818181818,0.19713993870000002,qwen2.5-7b-instruct,ner
banking77,lora_1.0_no_es_plus_tempscaling,128,0.1440245148,0.1409601634,0.1440245148,qwen2.5-7b-instruct,ner
banking77,lora_1.0_no_es_plus_tempscaling,256,0.1113381001,0.1082737487,0.1297242084,qwen2.5-7b-instruct,ner
banking77,no_adaptation,all,0.8621041879,0.8621041879,0.8621041879,qwen2.5-7b-instruct,ner
dbpedia,dp_calibration,8,0.33491311220000003,0.3206951027,0.3396524487,qwen2.5-7b-instruct,ner
dbpedia,dp_calibration,16,0.2859399684,0.2812006319,0.2875197472,qwen2.5-7b-instruct,ner
dbpedia,dp_calibration,32,0.2654028436,0.2575039494,0.2733017378,qwen2.5-7b-instruct,ner
dbpedia,dp_calibration,64,0.252764613,0.2464454976,0.2622432859,qwen2.5-7b-instruct,ner
dbpedia,dp_calibration,128,0.2559241706,0.2543443918,0.2622432859,qwen2.5-7b-instruct,ner
dbpedia,dp_calibration,256,0.2543443918,0.2543443918,0.2559241706,qwen2.5-7b-instruct,ner
dbpedia,lora_1.0_no_es,8,0.0821484992,0.0663507109,0.1042654028,qwen2.5-7b-instruct,ner
dbpedia,lora_1.0_no_es,16,0.0173775671,0.0142180095,0.0252764613,qwen2.5-7b-instruct,ner
dbpedia,lora_1.0_no_es,32,0.0142180095,0.0142180095,0.0157977883,qwen2.5-7b-instruct,ner
dbpedia,lora_1.0_no_es,64,0.0126382306,0.0110584518,0.0126382306,qwen2.5-7b-instruct,ner
dbpedia,lora_1.0_no_es,128,0.009478673,0.009478673,0.009478673,qwen2.5-7b-instruct,ner
dbpedia,lora_1.0_no_es,256,0.009478673,0.0063191153,0.009478673,qwen2.5-7b-instruct,ner
dbpedia,lora_1.0_no_es_plus_tempscaling,8,0.0821484992,0.0663507109,0.1042654028,qwen2.5-7b-instruct,ner
dbpedia,lora_1.0_no_es_plus_tempscaling,16,0.0173775671,0.0142180095,0.0252764613,qwen2.5-7b-instruct,ner
dbpedia,lora_1.0_no_es_plus_tempscaling,32,0.0142180095,0.0142180095,0.0157977883,qwen2.5-7b-instruct,ner
dbpedia,lora_1.0_no_es_plus_tempscaling,64,0.0126382306,0.0110584518,0.0126382306,qwen2.5-7b-instruct,ner
dbpedia,lora_1.0_no_es_plus_tempscaling,128,0.009478673,0.009478673,0.009478673,qwen2.5-7b-instruct,ner
dbpedia,lora_1.0_no_es_plus_tempscaling,256,0.009478673,0.0063191153,0.009478673,qwen2.5-7b-instruct,ner
dbpedia,no_adaptation,all,0.3854660348,0.3854660348,0.3854660348,qwen2.5-7b-instruct,ner
sst2,dp_calibration,8,0.11734693880000001,0.1020408163,0.1275510204,qwen2.5-7b-instruct,ner
sst2,dp_calibration,16,0.11224489800000001,0.1071428571,0.11734693880000001,qwen2.5-7b-instruct,ner
sst2,dp_calibration,32,0.11224489800000001,0.1071428571,0.11734693880000001,qwen2.5-7b-instruct,ner
sst2,dp_calibration,64,0.1071428571,0.1071428571,0.1071428571,qwen2.5-7b-instruct,ner
sst2,dp_calibration,128,0.11224489800000001,0.1020408163,0.11224489800000001,qwen2.5-7b-instruct,ner
sst2,dp_calibration,256,0.11224489800000001,0.1020408163,0.11224489800000001,qwen2.5-7b-instruct,ner
sst2,lora_1.0_no_es,8,0.1071428571,0.1020408163,0.1275510204,qwen2.5-7b-instruct,ner
sst2,lora_1.0_no_es,16,0.1071428571,0.1020408163,0.12244897960000001,qwen2.5-7b-instruct,ner
sst2,lora_1.0_no_es,32,0.1020408163,0.0918367347,0.11734693880000001,qwen2.5-7b-instruct,ner
sst2,lora_1.0_no_es,64,0.1020408163,0.0918367347,0.12244897960000001,qwen2.5-7b-instruct,ner
sst2,lora_1.0_no_es,128,0.1020408163,0.1020408163,0.1020408163,qwen2.5-7b-instruct,ner
sst2,lora_1.0_no_es,256,0.0969387755,0.0867346939,0.1071428571,qwen2.5-7b-instruct,ner
sst2,lora_1.0_no_es_plus_tempscaling,8,0.1071428571,0.1020408163,0.1275510204,qwen2.5-7b-instruct,ner
sst2,lora_1.0_no_es_plus_tempscaling,16,0.1071428571,0.1020408163,0.12244897960000001,qwen2.5-7b-instruct,ner
sst2,lora_1.0_no_es_plus_tempscaling,32,0.1020408163,0.0918367347,0.11734693880000001,qwen2.5-7b-instruct,ner
sst2,lora_1.0_no_es_plus_tempscaling,64,0.1020408163,0.0918367347,0.12244897960000001,qwen2.5-7b-instruct,ner
sst2,lora_1.0_no_es_plus_tempscaling,128,0.1020408163,0.1020408163,0.1020408163,qwen2.5-7b-instruct,ner
sst2,lora_1.0_no_es_plus_tempscaling,256,0.0969387755,0.0867346939,0.1071428571,qwen2.5-7b-instruct,ner
sst2,no_adaptation,all,0.11224489800000001,0.11224489800000001,0.11224489800000001,qwen2.5-7b-instruct,ner