File size: 15,678 Bytes
1892d8f
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
{
  "dataset_revision": "1f7e6a9d6fa6e64c53d146e428565640410c0df1",
  "task_name": "AmazonCounterfactualClassification",
  "mteb_version": "2.10.7",
  "scores": {
    "validation": [
      {
        "scores_per_experiment": [
          {
            "accuracy": 0.753754,
            "f1": 0.623225,
            "f1_weighted": 0.800371,
            "precision": 0.619778,
            "precision_weighted": 0.902615,
            "recall": 0.78357,
            "recall_weighted": 0.753754,
            "ap": 0.23613,
            "ap_weighted": 0.23613
          },
          {
            "accuracy": 0.704204,
            "f1": 0.571116,
            "f1_weighted": 0.761959,
            "precision": 0.586908,
            "precision_weighted": 0.884058,
            "recall": 0.716256,
            "recall_weighted": 0.704204,
            "ap": 0.184202,
            "ap_weighted": 0.184202
          },
          {
            "accuracy": 0.728228,
            "f1": 0.611557,
            "f1_weighted": 0.781609,
            "precision": 0.620103,
            "precision_weighted": 0.910621,
            "recall": 0.802519,
            "recall_weighted": 0.728228,
            "ap": 0.240132,
            "ap_weighted": 0.240132
          },
          {
            "accuracy": 0.659159,
            "f1": 0.545546,
            "f1_weighted": 0.727054,
            "precision": 0.582124,
            "precision_weighted": 0.887965,
            "recall": 0.717726,
            "recall_weighted": 0.659159,
            "ap": 0.178635,
            "ap_weighted": 0.178635
          },
          {
            "accuracy": 0.71021,
            "f1": 0.587738,
            "f1_weighted": 0.767229,
            "precision": 0.602572,
            "precision_weighted": 0.897745,
            "recall": 0.759363,
            "recall_weighted": 0.71021,
            "ap": 0.209328,
            "ap_weighted": 0.209328
          },
          {
            "accuracy": 0.684685,
            "f1": 0.56812,
            "f1_weighted": 0.747347,
            "precision": 0.594168,
            "precision_weighted": 0.895136,
            "recall": 0.745172,
            "recall_weighted": 0.684685,
            "ap": 0.196474,
            "ap_weighted": 0.196474
          },
          {
            "accuracy": 0.701201,
            "f1": 0.578823,
            "f1_weighted": 0.760175,
            "precision": 0.597242,
            "precision_weighted": 0.894588,
            "recall": 0.747726,
            "recall_weighted": 0.701201,
            "ap": 0.200863,
            "ap_weighted": 0.200863
          },
          {
            "accuracy": 0.698198,
            "f1": 0.568635,
            "f1_weighted": 0.757478,
            "precision": 0.587162,
            "precision_weighted": 0.885502,
            "recall": 0.719545,
            "recall_weighted": 0.698198,
            "ap": 0.184985,
            "ap_weighted": 0.184985
          },
          {
            "accuracy": 0.747748,
            "f1": 0.625988,
            "f1_weighted": 0.796452,
            "precision": 0.625755,
            "precision_weighted": 0.910405,
            "recall": 0.806743,
            "recall_weighted": 0.747748,
            "ap": 0.24925,
            "ap_weighted": 0.24925
          },
          {
            "accuracy": 0.708709,
            "f1": 0.568105,
            "f1_weighted": 0.76495,
            "precision": 0.581533,
            "precision_weighted": 0.878276,
            "recall": 0.698876,
            "recall_weighted": 0.708709,
            "ap": 0.175742,
            "ap_weighted": 0.175742
          }
        ],
        "accuracy": 0.70961,
        "f1": 0.584885,
        "f1_weighted": 0.766462,
        "precision": 0.599734,
        "precision_weighted": 0.894691,
        "recall": 0.74975,
        "recall_weighted": 0.70961,
        "ap": 0.205574,
        "ap_weighted": 0.205574,
        "main_score": 0.70961,
        "hf_subset": "en-ext",
        "languages": [
          "eng-Latn"
        ]
      },
      {
        "scores_per_experiment": [
          {
            "accuracy": 0.665672,
            "f1": 0.611594,
            "f1_weighted": 0.706338,
            "precision": 0.636594,
            "precision_weighted": 0.842013,
            "recall": 0.736493,
            "recall_weighted": 0.665672,
            "ap": 0.299211,
            "ap_weighted": 0.299211
          },
          {
            "accuracy": 0.701493,
            "f1": 0.637226,
            "f1_weighted": 0.737044,
            "precision": 0.645156,
            "precision_weighted": 0.840993,
            "recall": 0.744523,
            "recall_weighted": 0.701493,
            "ap": 0.312881,
            "ap_weighted": 0.312881
          },
          {
            "accuracy": 0.60597,
            "f1": 0.546852,
            "f1_weighted": 0.653851,
            "precision": 0.583924,
            "precision_weighted": 0.79384,
            "recall": 0.645867,
            "recall_weighted": 0.60597,
            "ap": 0.236533,
            "ap_weighted": 0.236533
          },
          {
            "accuracy": 0.677612,
            "f1": 0.605779,
            "f1_weighted": 0.715789,
            "precision": 0.616915,
            "precision_weighted": 0.815312,
            "recall": 0.696004,
            "recall_weighted": 0.677612,
            "ap": 0.27473,
            "ap_weighted": 0.27473
          },
          {
            "accuracy": 0.692537,
            "f1": 0.622851,
            "f1_weighted": 0.728832,
            "precision": 0.63076,
            "precision_weighted": 0.826836,
            "recall": 0.718661,
            "recall_weighted": 0.692537,
            "ap": 0.292763,
            "ap_weighted": 0.292763
          },
          {
            "accuracy": 0.689552,
            "f1": 0.596311,
            "f1_weighted": 0.723142,
            "precision": 0.598351,
            "precision_weighted": 0.792265,
            "recall": 0.655515,
            "recall_weighted": 0.689552,
            "ap": 0.250732,
            "ap_weighted": 0.250732
          },
          {
            "accuracy": 0.695522,
            "f1": 0.609825,
            "f1_weighted": 0.729365,
            "precision": 0.611822,
            "precision_weighted": 0.804774,
            "recall": 0.679572,
            "recall_weighted": 0.695522,
            "ap": 0.267173,
            "ap_weighted": 0.267173
          },
          {
            "accuracy": 0.674627,
            "f1": 0.57847,
            "f1_weighted": 0.710085,
            "precision": 0.583686,
            "precision_weighted": 0.780874,
            "recall": 0.632858,
            "recall_weighted": 0.674627,
            "ap": 0.235104,
            "ap_weighted": 0.235104
          },
          {
            "accuracy": 0.692537,
            "f1": 0.622851,
            "f1_weighted": 0.728832,
            "precision": 0.63076,
            "precision_weighted": 0.826836,
            "recall": 0.718661,
            "recall_weighted": 0.692537,
            "ap": 0.292763,
            "ap_weighted": 0.292763
          },
          {
            "accuracy": 0.647761,
            "f1": 0.57702,
            "f1_weighted": 0.690103,
            "precision": 0.596703,
            "precision_weighted": 0.800007,
            "recall": 0.664322,
            "recall_weighted": 0.647761,
            "ap": 0.250776,
            "ap_weighted": 0.250776
          }
        ],
        "accuracy": 0.674328,
        "f1": 0.600878,
        "f1_weighted": 0.712338,
        "precision": 0.613467,
        "precision_weighted": 0.812375,
        "recall": 0.689247,
        "recall_weighted": 0.674328,
        "ap": 0.271267,
        "ap_weighted": 0.271267,
        "main_score": 0.674328,
        "hf_subset": "en",
        "languages": [
          "eng-Latn"
        ]
      }
    ],
    "test": [
      {
        "scores_per_experiment": [
          {
            "accuracy": 0.787106,
            "f1": 0.6618,
            "f1_weighted": 0.82476,
            "precision": 0.644837,
            "precision_weighted": 0.909338,
            "recall": 0.817597,
            "recall_weighted": 0.787106,
            "ap": 0.280992,
            "ap_weighted": 0.280992
          },
          {
            "accuracy": 0.736882,
            "f1": 0.615747,
            "f1_weighted": 0.786532,
            "precision": 0.618779,
            "precision_weighted": 0.900943,
            "recall": 0.783206,
            "recall_weighted": 0.736882,
            "ap": 0.237303,
            "ap_weighted": 0.237303
          },
          {
            "accuracy": 0.742879,
            "f1": 0.625424,
            "f1_weighted": 0.791464,
            "precision": 0.626567,
            "precision_weighted": 0.906989,
            "recall": 0.802447,
            "recall_weighted": 0.742879,
            "ap": 0.25176,
            "ap_weighted": 0.25176
          },
          {
            "accuracy": 0.658171,
            "f1": 0.537212,
            "f1_weighted": 0.724503,
            "precision": 0.570547,
            "precision_weighted": 0.870972,
            "recall": 0.678878,
            "recall_weighted": 0.658171,
            "ap": 0.16542,
            "ap_weighted": 0.16542
          },
          {
            "accuracy": 0.754873,
            "f1": 0.629012,
            "f1_weighted": 0.800066,
            "precision": 0.624459,
            "precision_weighted": 0.900998,
            "recall": 0.786891,
            "recall_weighted": 0.754873,
            "ap": 0.245608,
            "ap_weighted": 0.245608
          },
          {
            "accuracy": 0.715892,
            "f1": 0.59492,
            "f1_weighted": 0.770155,
            "precision": 0.606268,
            "precision_weighted": 0.894236,
            "recall": 0.758776,
            "recall_weighted": 0.715892,
            "ap": 0.216622,
            "ap_weighted": 0.216622
          },
          {
            "accuracy": 0.715142,
            "f1": 0.59242,
            "f1_weighted": 0.769462,
            "precision": 0.603797,
            "precision_weighted": 0.891985,
            "recall": 0.752,
            "recall_weighted": 0.715142,
            "ap": 0.212437,
            "ap_weighted": 0.212437
          },
          {
            "accuracy": 0.718891,
            "f1": 0.595394,
            "f1_weighted": 0.772344,
            "precision": 0.605197,
            "precision_weighted": 0.892422,
            "recall": 0.754092,
            "recall_weighted": 0.718891,
            "ap": 0.214527,
            "ap_weighted": 0.214527
          },
          {
            "accuracy": 0.750375,
            "f1": 0.624186,
            "f1_weighted": 0.796573,
            "precision": 0.621365,
            "precision_weighted": 0.899394,
            "recall": 0.781202,
            "recall_weighted": 0.750375,
            "ap": 0.240296,
            "ap_weighted": 0.240296
          },
          {
            "accuracy": 0.732384,
            "f1": 0.608214,
            "f1_weighted": 0.782812,
            "precision": 0.612646,
            "precision_weighted": 0.896151,
            "recall": 0.767981,
            "recall_weighted": 0.732384,
            "ap": 0.22639,
            "ap_weighted": 0.22639
          }
        ],
        "accuracy": 0.731259,
        "f1": 0.608433,
        "f1_weighted": 0.781867,
        "precision": 0.613446,
        "precision_weighted": 0.896343,
        "recall": 0.768307,
        "recall_weighted": 0.731259,
        "ap": 0.229135,
        "ap_weighted": 0.229135,
        "main_score": 0.731259,
        "hf_subset": "en-ext",
        "languages": [
          "eng-Latn"
        ]
      },
      {
        "scores_per_experiment": [
          {
            "accuracy": 0.683582,
            "f1": 0.638763,
            "f1_weighted": 0.716247,
            "precision": 0.65592,
            "precision_weighted": 0.832264,
            "recall": 0.745557,
            "recall_weighted": 0.683582,
            "ap": 0.340258,
            "ap_weighted": 0.340258
          },
          {
            "accuracy": 0.704478,
            "f1": 0.648188,
            "f1_weighted": 0.733883,
            "precision": 0.651851,
            "precision_weighted": 0.819598,
            "recall": 0.732541,
            "recall_weighted": 0.704478,
            "ap": 0.336346,
            "ap_weighted": 0.336346
          },
          {
            "accuracy": 0.653731,
            "f1": 0.607475,
            "f1_weighted": 0.68953,
            "precision": 0.630889,
            "precision_weighted": 0.810116,
            "recall": 0.70678,
            "recall_weighted": 0.653731,
            "ap": 0.307499,
            "ap_weighted": 0.307499
          },
          {
            "accuracy": 0.692537,
            "f1": 0.637034,
            "f1_weighted": 0.723467,
            "precision": 0.644143,
            "precision_weighted": 0.814359,
            "recall": 0.722231,
            "recall_weighted": 0.692537,
            "ap": 0.325896,
            "ap_weighted": 0.325896
          },
          {
            "accuracy": 0.71194,
            "f1": 0.657558,
            "f1_weighted": 0.740659,
            "precision": 0.660351,
            "precision_weighted": 0.827401,
            "recall": 0.745847,
            "recall_weighted": 0.71194,
            "ap": 0.348219,
            "ap_weighted": 0.348219
          },
          {
            "accuracy": 0.702985,
            "f1": 0.645907,
            "f1_weighted": 0.732479,
            "precision": 0.649537,
            "precision_weighted": 0.817282,
            "recall": 0.728724,
            "recall_weighted": 0.702985,
            "ap": 0.333184,
            "ap_weighted": 0.333184
          },
          {
            "accuracy": 0.755224,
            "f1": 0.685197,
            "f1_weighted": 0.775611,
            "precision": 0.672736,
            "precision_weighted": 0.822982,
            "recall": 0.743857,
            "recall_weighted": 0.755224,
            "ap": 0.362669,
            "ap_weighted": 0.362669
          },
          {
            "accuracy": 0.735821,
            "f1": 0.675433,
            "f1_weighted": 0.760687,
            "precision": 0.669476,
            "precision_weighted": 0.828703,
            "recall": 0.752022,
            "recall_weighted": 0.735821,
            "ap": 0.360963,
            "ap_weighted": 0.360963
          },
          {
            "accuracy": 0.650746,
            "f1": 0.599336,
            "f1_weighted": 0.686734,
            "precision": 0.619405,
            "precision_weighted": 0.797005,
            "recall": 0.687589,
            "recall_weighted": 0.650746,
            "ap": 0.294448,
            "ap_weighted": 0.294448
          },
          {
            "accuracy": 0.658209,
            "f1": 0.604451,
            "f1_weighted": 0.69325,
            "precision": 0.621122,
            "precision_weighted": 0.797068,
            "recall": 0.689338,
            "recall_weighted": 0.658209,
            "ap": 0.29672,
            "ap_weighted": 0.29672
          }
        ],
        "accuracy": 0.694925,
        "f1": 0.639934,
        "f1_weighted": 0.725255,
        "precision": 0.647543,
        "precision_weighted": 0.816678,
        "recall": 0.725449,
        "recall_weighted": 0.694925,
        "ap": 0.33062,
        "ap_weighted": 0.33062,
        "main_score": 0.694925,
        "hf_subset": "en",
        "languages": [
          "eng-Latn"
        ]
      }
    ]
  },
  "evaluation_time": 46.4682559967041,
  "kg_co2_emissions": null,
  "date": null
}