amirali1985 commited on
Commit
37d7571
·
verified ·
1 Parent(s): 80733ca

Upload add_sub_sorl_v1_abs50_50K

Browse files
add_sub_sorl_v1_abs50_50K/metrics.json CHANGED
@@ -153,1069 +153,1069 @@
153
  7788
154
  ],
155
  "loss": [
156
- 7.256625652313232,
157
- 3.0191478729248047,
158
- 2.4123916625976562,
159
- 2.1674225330352783,
160
- 2.1556787490844727,
161
- 1.8286030292510986,
162
- 2.14564847946167,
163
- 1.900666356086731,
164
- 1.652380108833313,
165
- 1.6646597385406494,
166
- 1.5041191577911377,
167
- 1.546173334121704,
168
- 0.7197972536087036,
169
- 0.08199936151504517,
170
- -3.1339755058288574,
171
- -10.444205284118652,
172
- -10.103414535522461,
173
- -12.214149475097656,
174
- -12.902936935424805,
175
- -13.465953826904297,
176
- -13.666388511657715,
177
- -14.849788665771484,
178
- -14.489677429199219,
179
- -14.085216522216797,
180
- -15.04929256439209,
181
- -14.683259010314941,
182
- -13.91379451751709,
183
- -15.094310760498047,
184
- -13.880881309509277,
185
- -14.374068260192871,
186
- -14.42313003540039,
187
- -14.229098320007324,
188
- -15.09312629699707,
189
- -14.730694770812988,
190
- -14.6654634475708,
191
- -13.932817459106445,
192
- -14.541162490844727,
193
- -13.534533500671387,
194
- -14.629840850830078,
195
- -14.549479484558105,
196
- -14.572128295898438,
197
- -14.297953605651855,
198
- -14.748451232910156,
199
- -14.658515930175781,
200
- -14.846949577331543,
201
- -14.570510864257812,
202
- -14.642899513244629,
203
- -15.091267585754395,
204
- -14.61697769165039,
205
- -14.35709285736084,
206
- -14.233384132385254,
207
- -13.99492073059082,
208
- -13.887598037719727,
209
- -13.822426795959473,
210
- -13.868623733520508,
211
- -13.392026901245117,
212
- -14.518260955810547,
213
- -12.745328903198242,
214
- -9.385150909423828,
215
- -8.4232177734375,
216
- -5.4400715827941895,
217
- -5.325277805328369,
218
- -5.132301330566406,
219
- -4.313063621520996,
220
- -3.695901870727539,
221
- -3.7530672550201416,
222
- -3.7038750648498535,
223
- -3.661875009536743,
224
- -3.2753937244415283,
225
- -3.360624074935913,
226
- -2.504333257675171,
227
- -3.0331249237060547,
228
- -3.0124270915985107,
229
- -2.910573720932007,
230
- -3.7368786334991455,
231
- -2.7395472526550293,
232
- -2.6733858585357666,
233
- -2.886018991470337,
234
- -2.6889913082122803,
235
- -2.5152089595794678,
236
- -2.2789855003356934,
237
- -2.7361295223236084,
238
- -2.4921624660491943,
239
- -2.7641701698303223,
240
- -4.348557949066162,
241
- -2.480908155441284,
242
- -2.207150936126709,
243
- -2.63488507270813,
244
- -2.250746726989746,
245
- -2.611670970916748,
246
- -2.541576385498047,
247
- -2.34275484085083,
248
- -2.689805746078491,
249
- -2.281898021697998,
250
- -2.7649309635162354,
251
- -2.1240293979644775,
252
- -2.607470750808716,
253
- -2.4728121757507324,
254
- -2.0544490814208984,
255
- -2.0300307273864746,
256
- -2.1023619174957275,
257
- -1.887721061706543,
258
- -2.0482027530670166,
259
- -1.9892445802688599,
260
- -1.9722803831100464,
261
- -2.084959030151367,
262
- -2.446387529373169,
263
- -1.835938811302185,
264
- -2.5824408531188965,
265
- -2.1360812187194824,
266
- -1.9915828704833984,
267
- -1.6431983709335327,
268
- -1.4731082916259766,
269
- -1.7144525051116943,
270
- -1.7019168138504028,
271
- -1.6519891023635864,
272
- -1.7413341999053955,
273
- -1.588895320892334,
274
- -1.539756417274475,
275
- -1.904645562171936,
276
- -1.5546034574508667,
277
- -1.7151820659637451,
278
- -1.450798511505127,
279
- -1.574430227279663,
280
- -1.8458795547485352,
281
- -1.5194255113601685,
282
- -1.6603127717971802,
283
- -2.0166845321655273,
284
- -1.2642289400100708,
285
- -1.7409981489181519,
286
- -1.6157901287078857,
287
- -1.5526642799377441,
288
- -1.2320806980133057,
289
- -1.5149484872817993,
290
- -1.4476909637451172,
291
- -1.6797325611114502,
292
- -1.3895442485809326,
293
- -1.231076717376709,
294
- -1.2591882944107056,
295
- -1.7371399402618408,
296
- -1.5310636758804321,
297
- -1.4542627334594727,
298
- -1.2413599491119385,
299
- -1.226067304611206,
300
- -1.6244958639144897,
301
- -1.3765522241592407,
302
- -1.362652063369751,
303
- -1.392403244972229,
304
- -1.3551605939865112,
305
- -1.0807950496673584
306
  ],
307
  "base_loss": [
308
- 6.029807090759277,
309
- 2.3067009449005127,
310
- 1.9342564344406128,
311
- 1.8905317783355713,
312
- 1.8440930843353271,
313
- 1.8317269086837769,
314
- 1.8801648616790771,
315
- 1.8195487260818481,
316
- 1.7616671323776245,
317
- 1.7560369968414307,
318
- 1.7867367267608643,
319
- 1.7833213806152344,
320
- 1.7948106527328491,
321
- 1.7519046068191528,
322
- 1.948911428451538,
323
- 2.001823902130127,
324
- 1.8075017929077148,
325
- 1.8323737382888794,
326
- 1.797086477279663,
327
- 1.8139381408691406,
328
- 1.751043438911438,
329
- 1.8313592672348022,
330
- 1.751556634902954,
331
- 1.7140840291976929,
332
- 1.789836049079895,
333
- 1.7125715017318726,
334
- 1.6791929006576538,
335
- 1.7678550481796265,
336
- 1.6537859439849854,
337
- 1.6602624654769897,
338
- 1.6753387451171875,
339
- 1.6629526615142822,
340
- 1.7369420528411865,
341
- 1.683754563331604,
342
- 1.6948719024658203,
343
- 1.6238089799880981,
344
- 1.6669832468032837,
345
- 1.5685263872146606,
346
- 1.6912544965744019,
347
- 1.6462609767913818,
348
- 1.6818253993988037,
349
- 1.636511206626892,
350
- 1.6857174634933472,
351
- 1.669575810432434,
352
- 1.6751861572265625,
353
- 1.6484739780426025,
354
- 1.6467863321304321,
355
- 1.6952067613601685,
356
- 1.6533762216567993,
357
- 1.616503357887268,
358
- 1.6140310764312744,
359
- 1.5757274627685547,
360
- 1.5750893354415894,
361
- 1.556767225265503,
362
- 1.5602978467941284,
363
- 1.515640139579773,
364
- 1.6252305507659912,
365
- 1.4415589570999146,
366
- 1.0609798431396484,
367
- 0.9612196683883667,
368
- 0.616158127784729,
369
- 0.6064944863319397,
370
- 0.5862141251564026,
371
- 0.4924693703651428,
372
- 0.4313984513282776,
373
- 0.42700475454330444,
374
- 0.42180582880973816,
375
- 0.41957685351371765,
376
- 0.37408900260925293,
377
- 0.38498300313949585,
378
- 0.28954702615737915,
379
- 0.348208487033844,
380
- 0.3462330996990204,
381
- 0.3341756761074066,
382
- 0.4224683344364166,
383
- 0.3134305477142334,
384
- 0.3083657920360565,
385
- 0.3302149474620819,
386
- 0.30693626403808594,
387
- 0.2877400815486908,
388
- 0.2639155685901642,
389
- 0.3185356557369232,
390
- 0.2856982350349426,
391
- 0.31456050276756287,
392
- 0.49335941672325134,
393
- 0.28367578983306885,
394
- 0.25294229388237,
395
- 0.30259618163108826,
396
- 0.2595691978931427,
397
- 0.30289167165756226,
398
- 0.291527658700943,
399
- 0.26810169219970703,
400
- 0.3059633672237396,
401
- 0.2611132562160492,
402
- 0.3158523738384247,
403
- 0.2444075345993042,
404
- 0.29604029655456543,
405
- 0.2825319468975067,
406
- 0.23427459597587585,
407
- 0.23259370028972626,
408
- 0.2404058873653412,
409
- 0.21756012737751007,
410
- 0.23280969262123108,
411
- 0.22855813801288605,
412
- 0.2257063388824463,
413
- 0.23912663757801056,
414
- 0.27966248989105225,
415
- 0.21003004908561707,
416
- 0.29382458329200745,
417
- 0.2435278445482254,
418
- 0.2295869141817093,
419
- 0.18904468417167664,
420
- 0.17142455279827118,
421
- 0.1948322355747223,
422
- 0.19676467776298523,
423
- 0.19100677967071533,
424
- 0.19870205223560333,
425
- 0.18229179084300995,
426
- 0.17854009568691254,
427
- 0.2182820737361908,
428
- 0.1792173683643341,
429
- 0.19656817615032196,
430
- 0.16844725608825684,
431
- 0.18259193003177643,
432
- 0.21280623972415924,
433
- 0.17412368953227997,
434
- 0.19087910652160645,
435
- 0.22902394831180573,
436
- 0.14896346628665924,
437
- 0.20004956424236298,
438
- 0.18591725826263428,
439
- 0.17941395938396454,
440
- 0.14243106544017792,
441
- 0.17380957305431366,
442
- 0.16619420051574707,
443
- 0.19304493069648743,
444
- 0.15973064303398132,
445
- 0.1419793665409088,
446
- 0.1448678970336914,
447
- 0.2004563808441162,
448
- 0.17605385184288025,
449
- 0.16834628582000732,
450
- 0.14428769052028656,
451
- 0.14093129336833954,
452
- 0.18535971641540527,
453
- 0.1585533171892166,
454
- 0.1568572074174881,
455
- 0.15938758850097656,
456
- 0.15521882474422455,
457
- 0.126205712556839
458
  ],
459
  "info_loss": [
460
- -0.20561504364013672,
461
- -0.03972625732421875,
462
- -0.048748135566711426,
463
- -0.06750452518463135,
464
- -0.06405246257781982,
465
- -0.09477114677429199,
466
- -0.06761360168457031,
467
- -0.08672130107879639,
468
- -0.10533666610717773,
469
- -0.10386943817138672,
470
- -0.12152564525604248,
471
- -0.11574661731719971,
472
- -0.19611811637878418,
473
- -0.24177753925323486,
474
- -0.5657413005828857,
475
- -1.2865196466445923,
476
- -1.2276489734649658,
477
- -1.4379183053970337,
478
- -1.5007377862930298,
479
- -1.5571799278259277,
480
- -1.5694807767868042,
481
- -1.6956429481506348,
482
- -1.6478774547576904,
483
- -1.6037368774414062,
484
- -1.7057857513427734,
485
- -1.6578631401062012,
486
- -1.5784200429916382,
487
- -1.7046573162078857,
488
- -1.569814682006836,
489
- -1.6190284490585327,
490
- -1.6252418756484985,
491
- -1.6039395332336426,
492
- -1.6967638731002808,
493
- -1.6540355682373047,
494
- -1.6475841999053955,
495
- -1.5689774751663208,
496
- -1.635087251663208,
497
- -1.5238193273544312,
498
- -1.6450031995773315,
499
- -1.630631685256958,
500
- -1.637630820274353,
501
- -1.6060518026351929,
502
- -1.6621246337890625,
503
- -1.6464064121246338,
504
- -1.6617577075958252,
505
- -1.6344650983810425,
506
- -1.6399197578430176,
507
- -1.6889852285385132,
508
- -1.639074444770813,
509
- -1.6081275939941406,
510
- -1.5951539278030396,
511
- -1.566024661064148,
512
- -1.5557743310928345,
513
- -1.5495342016220093,
514
- -1.5556063652038574,
515
- -1.5009874105453491,
516
- -1.6231387853622437,
517
- -1.4322359561920166,
518
- -1.0561802387237549,
519
- -0.9466190338134766,
520
- -0.6137336492538452,
521
- -0.6038743257522583,
522
- -0.5819218754768372,
523
- -0.4909442663192749,
524
- -0.4217419922351837,
525
- -0.4254307448863983,
526
- -0.4203161597251892,
527
- -0.4181394577026367,
528
- -0.3734082281589508,
529
- -0.38232800364494324,
530
- -0.2871572971343994,
531
- -0.34667515754699707,
532
- -0.3433464467525482,
533
- -0.3323284983634949,
534
- -0.4220069944858551,
535
- -0.3129675090312958,
536
- -0.30473649501800537,
537
- -0.32990047335624695,
538
- -0.3063972592353821,
539
- -0.28762325644493103,
540
- -0.2610863447189331,
541
- -0.312552273273468,
542
- -0.2848331332206726,
543
- -0.3143031597137451,
544
- -0.49174460768699646,
545
- -0.2831017076969147,
546
- -0.25272035598754883,
547
- -0.3016011118888855,
548
- -0.2592092454433441,
549
- -0.2988108992576599,
550
- -0.2913071811199188,
551
- -0.2679586410522461,
552
- -0.3054676353931427,
553
- -0.26094746589660645,
554
- -0.3152065873146057,
555
- -0.24421927332878113,
556
- -0.295553594827652,
557
- -0.28226152062416077,
558
- -0.2340558022260666,
559
- -0.23213818669319153,
560
- -0.24020898342132568,
561
- -0.21750272810459137,
562
- -0.23276019096374512,
563
- -0.22842691838741302,
564
- -0.22563359141349792,
565
- -0.23904889822006226,
566
- -0.2794150114059448,
567
- -0.20988059043884277,
568
- -0.29378125071525574,
569
- -0.24314871430397034,
570
- -0.2293650060892105,
571
- -0.18900363147258759,
572
- -0.17137543857097626,
573
- -0.1948050558567047,
574
- -0.19659706950187683,
575
- -0.19093747437000275,
576
- -0.19865652918815613,
577
- -0.1822470873594284,
578
- -0.1785041093826294,
579
- -0.21816547214984894,
580
- -0.17919395864009857,
581
- -0.19648776948451996,
582
- -0.16839498281478882,
583
- -0.18214161694049835,
584
- -0.212591290473938,
585
- -0.17409944534301758,
586
- -0.19081123173236847,
587
- -0.2289951741695404,
588
- -0.14660219848155975,
589
- -0.20001469552516937,
590
- -0.18589811027050018,
591
- -0.1793726533651352,
592
- -0.14236652851104736,
593
- -0.1737845093011856,
594
- -0.16613999009132385,
595
- -0.19301597774028778,
596
- -0.15971405804157257,
597
- -0.14195962250232697,
598
- -0.14485248923301697,
599
- -0.20041891932487488,
600
- -0.17602841556072235,
601
- -0.16832193732261658,
602
- -0.14427153766155243,
603
- -0.14090751111507416,
604
- -0.18532036244869232,
605
- -0.1585266888141632,
606
- -0.15683983266353607,
607
- -0.15936271846294403,
608
- -0.1551767736673355,
609
- -0.12618587911128998
610
  ],
611
  "abs_loss": [
612
- 3.7497520446777344,
613
- 2.6481971740722656,
614
- 2.8985848426818848,
615
- 2.818944215774536,
616
- 2.870543956756592,
617
- 2.872476100921631,
618
- 2.758188247680664,
619
- 2.8428196907043457,
620
- 2.7872250080108643,
621
- 2.910464286804199,
622
- 2.752615213394165,
623
- 2.7820749282836914,
624
- 2.7789087295532227,
625
- 2.835494041442871,
626
- 2.5386619567871094,
627
- 2.0468544960021973,
628
- 1.7976104021072388,
629
- 1.6245003938674927,
630
- 1.4929277896881104,
631
- 1.4750802516937256,
632
- 1.5771673917770386,
633
- 1.666552186012268,
634
- 1.0843603610992432,
635
- 1.545884132385254,
636
- 1.4265331029891968,
637
- 0.999521017074585,
638
- 1.2854008674621582,
639
- 1.195152759552002,
640
- 1.1227796077728271,
641
- 0.9406141042709351,
642
- 1.0983028411865234,
643
- 0.85012286901474,
644
- 0.8116261959075928,
645
- 0.7224507927894592,
646
- 0.8427834510803223,
647
- 0.8805156946182251,
648
- 0.8626446723937988,
649
- 0.9968369007110596,
650
- 0.9508752822875977,
651
- 0.8513461351394653,
652
- 0.6574622392654419,
653
- 0.8986561298370361,
654
- 0.5942917466163635,
655
- 0.7797585129737854,
656
- 0.7031676173210144,
657
- 0.6163696050643921,
658
- 0.6315547227859497,
659
- 0.7303791046142578,
660
- 0.5330150723457336,
661
- 0.5637519359588623,
662
- 0.5594895482063293,
663
- 0.5726730823516846,
664
- 0.5400386452674866,
665
- 0.5256966352462769,
666
- 0.44924086332321167,
667
- 0.47774025797843933,
668
- 0.5889784097671509,
669
- 0.4862280488014221,
670
- 0.5457887649536133,
671
- 0.4811607599258423,
672
- 0.5763522982597351,
673
- 0.4618305563926697,
674
- 0.49888068437576294,
675
- 0.5134003758430481,
676
- 0.4723852872848511,
677
- 0.4225727915763855,
678
- 0.3785339295864105,
679
- 0.3270162343978882,
680
- 0.3133487105369568,
681
- 0.33950677514076233,
682
- 0.32967162132263184,
683
- 0.3334130644798279,
684
- 0.31977397203445435,
685
- 0.39836356043815613,
686
- 0.3870335817337036,
687
- 0.27905893325805664,
688
- 0.38264474272727966,
689
- 0.3101273775100708,
690
- 0.2242627888917923,
691
- 0.24193796515464783,
692
- 0.222909078001976,
693
- 0.20927608013153076,
694
- 0.23676183819770813,
695
- 0.30053985118865967,
696
- 0.34205877780914307,
697
- 0.22115281224250793,
698
- 0.252194344997406,
699
- 0.2795361876487732,
700
- 0.2963107228279114,
701
- 0.26521268486976624,
702
- 0.3244202733039856,
703
- 0.28083187341690063,
704
- 0.18782655894756317,
705
- 0.273157000541687,
706
- 0.21937644481658936,
707
- 0.2191070020198822,
708
- 0.2309451699256897,
709
- 0.2086794078350067,
710
- 0.20153307914733887,
711
- 0.2183530181646347,
712
- 0.17671014368534088,
713
- 0.1841510534286499,
714
- 0.22086754441261292,
715
- 0.23169928789138794,
716
- 0.27007248997688293,
717
- 0.20892009139060974,
718
- 0.17916454374790192,
719
- 0.20730438828468323,
720
- 0.20521558821201324,
721
- 0.17557865381240845,
722
- 0.18920457363128662,
723
- 0.20690660178661346,
724
- 0.1799832135438919,
725
- 0.15656515955924988,
726
- 0.18862086534500122,
727
- 0.17772457003593445,
728
- 0.17366942763328552,
729
- 0.16974030435085297,
730
- 0.16747745871543884,
731
- 0.16128060221672058,
732
- 0.19063544273376465,
733
- 0.1916358768939972,
734
- 0.20035310089588165,
735
- 0.16092176735401154,
736
- 0.1909703016281128,
737
- 0.1657269448041916,
738
- 0.1640641689300537,
739
- 0.14971278607845306,
740
- 0.10842731595039368,
741
- 0.2196534425020218,
742
- 0.16537384688854218,
743
- 0.1963886320590973,
744
- 0.16384944319725037,
745
- 0.13870114088058472,
746
- 0.147671639919281,
747
- 0.17166978120803833,
748
- 0.15626773238182068,
749
- 0.17788034677505493,
750
- 0.1344836950302124,
751
- 0.1465415060520172,
752
- 0.19216865301132202,
753
- 0.13693669438362122,
754
- 0.1630391776561737,
755
- 0.11989884078502655,
756
- 0.1325468271970749,
757
- 0.1899355947971344,
758
- 0.12264394760131836,
759
- 0.12508927285671234,
760
- 0.1484333872795105,
761
- 0.13628548383712769
762
  ],
763
  "zipf_loss": [
764
- 2.907993793487549,
765
- 0.8448899388313293,
766
- 0.6757582426071167,
767
- 0.6700415015220642,
768
- 0.6650558114051819,
769
- 0.6573399305343628,
770
- 0.6658006906509399,
771
- 0.6640486717224121,
772
- 0.6653571128845215,
773
- 0.6562708020210266,
774
- 0.6573773622512817,
775
- 0.6421106457710266,
776
- 0.6082768440246582,
777
- 0.46432074904441833,
778
- 0.3206597566604614,
779
- 0.21448186039924622,
780
- 0.1858120709657669,
781
- 0.17020957171916962,
782
- 0.1580614596605301,
783
- 0.14439967274665833,
784
- 0.11965931951999664,
785
- 0.1086258664727211,
786
- 0.12910524010658264,
787
- 0.08348017930984497,
788
- 0.07607515156269073,
789
- 0.0828506276011467,
790
- 0.06267359852790833,
791
- 0.06489258259534836,
792
- 0.051201872527599335,
793
- 0.06189261004328728,
794
- 0.04411982744932175,
795
- 0.06233106553554535,
796
- 0.05640706419944763,
797
- 0.05366092175245285,
798
- 0.031228451058268547,
799
- 0.04509659856557846,
800
- 0.05646108090877533,
801
- 0.0354497954249382,
802
- 0.033848002552986145,
803
- 0.025441396981477737,
804
- 0.05660788342356682,
805
- 0.0361880287528038,
806
- 0.12764789164066315,
807
- 0.057995907962322235,
808
- 0.025125017389655113,
809
- 0.06402861326932907,
810
- 0.046355463564395905,
811
- 0.03033997118473053,
812
- 0.06708943098783493,
813
- 0.05130421370267868,
814
- 0.04817532002925873,
815
- 0.03233150392770767,
816
- 0.041051946580410004,
817
- 0.06357830762863159,
818
- 0.08221856504678726,
819
- 0.05443323031067848,
820
- 0.028998034074902534,
821
- 0.08684802800416946,
822
- 0.0610925555229187,
823
- 0.0336371473968029,
824
- 0.023472048342227936,
825
- 0.06078788638114929,
826
- 0.05081494152545929,
827
- 0.05256975442171097,
828
- 0.042881276458501816,
829
- 0.031977828592061996,
830
- 0.03962726891040802,
831
- 0.06724098324775696,
832
- 0.05326463282108307,
833
- 0.04372230917215347,
834
- 0.04472571983933449,
835
- 0.052076928317546844,
836
- 0.042826779186725616,
837
- 0.03869928792119026,
838
- 0.02201938070356846,
839
- 0.04879137873649597,
840
- 0.02734885923564434,
841
- 0.05175810307264328,
842
- 0.04561843350529671,
843
- 0.04908981919288635,
844
- 0.045671574771404266,
845
- 0.04992988705635071,
846
- 0.04679465293884277,
847
- 0.0342470221221447,
848
- 0.04132283851504326,
849
- 0.04431803524494171,
850
- 0.04189082980155945,
851
- 0.0505763441324234,
852
- 0.05214542895555496,
853
- 0.047025106847286224,
854
- 0.04752563685178757,
855
- 0.04064689949154854,
856
- 0.04012472555041313,
857
- 0.03914778679609299,
858
- 0.04934476315975189,
859
- 0.051845304667949677,
860
- 0.028930390253663063,
861
- 0.04640305042266846,
862
- 0.03168107569217682,
863
- 0.03692198544740677,
864
- 0.041651077568531036,
865
- 0.05133098363876343,
866
- 0.024502430111169815,
867
- 0.04329643025994301,
868
- 0.031341951340436935,
869
- 0.04551147669553757,
870
- 0.0501837432384491,
871
- 0.03210654854774475,
872
- 0.041025444865226746,
873
- 0.03432022035121918,
874
- 0.0535600446164608,
875
- 0.03710262104868889,
876
- 0.051223304122686386,
877
- 0.02310934104025364,
878
- 0.04842713102698326,
879
- 0.04860638454556465,
880
- 0.029162120074033737,
881
- 0.03430991619825363,
882
- 0.04999687895178795,
883
- 0.042598988860845566,
884
- 0.03905525058507919,
885
- 0.03396385908126831,
886
- 0.04466875270009041,
887
- 0.04830180108547211,
888
- 0.048130013048648834,
889
- 0.03087255358695984,
890
- 0.040513940155506134,
891
- 0.029271963983774185,
892
- 0.04198697581887245,
893
- 0.037133827805519104,
894
- 0.04073633253574371,
895
- 0.04200948029756546,
896
- 0.032768625766038895,
897
- 0.03521694615483284,
898
- 0.03274751082062721,
899
- 0.040215421468019485,
900
- 0.03223889321088791,
901
- 0.02875204011797905,
902
- 0.031020455062389374,
903
- 0.05193880572915077,
904
- 0.03394973650574684,
905
- 0.046916697174310684,
906
- 0.04076382517814636,
907
- 0.030086800456047058,
908
- 0.03009340539574623,
909
- 0.031167635694146156,
910
- 0.03662469983100891,
911
- 0.029327519237995148,
912
- 0.02654491364955902,
913
- 0.04122946411371231
914
  ],
915
  "denoise_loss": [],
916
  "ortho_loss": [
917
- 0.10270898044109344,
918
- 0.045592378824949265,
919
- 0.034897129982709885,
920
- 0.03289920464158058,
921
- 0.03318662568926811,
922
- 0.035863105207681656,
923
- 0.03718609735369682,
924
- 0.04016987606883049,
925
- 0.04869673773646355,
926
- 0.053654879331588745,
927
- 0.061492759734392166,
928
- 0.06294921040534973,
929
- 0.06910595297813416,
930
- 0.07273681461811066,
931
- 0.076898954808712,
932
- 0.0958031639456749,
933
- 0.1058020293712616,
934
- 0.11720982193946838,
935
- 0.13132666051387787,
936
- 0.1452067792415619,
937
- 0.15491452813148499,
938
- 0.16184890270233154,
939
- 0.17446120083332062,
940
- 0.18189102411270142,
941
- 0.1888672560453415,
942
- 0.19659653306007385,
943
- 0.1996685415506363,
944
- 0.20556356012821198,
945
- 0.2079426646232605,
946
- 0.21441443264484406,
947
- 0.2170758992433548,
948
- 0.22126887738704681,
949
- 0.22582681477069855,
950
- 0.22605378925800323,
951
- 0.2280348688364029,
952
- 0.2285757064819336,
953
- 0.22907176613807678,
954
- 0.23065848648548126,
955
- 0.23264732956886292,
956
- 0.234690859913826,
957
- 0.23757733404636383,
958
- 0.23970840871334076,
959
- 0.2384733259677887,
960
- 0.23657508194446564,
961
- 0.23852205276489258,
962
- 0.24019040167331696,
963
- 0.23936468362808228,
964
- 0.23304446041584015,
965
- 0.23387999832630157,
966
- 0.2349344789981842,
967
- 0.23946575820446014,
968
- 0.24182644486427307,
969
- 0.24514825642108917,
970
- 0.2487141191959381,
971
- 0.2516993284225464,
972
- 0.2516952455043793,
973
- 0.2530873715877533,
974
- 0.2569259703159332,
975
- 0.2646262049674988,
976
- 0.2720961272716522,
977
- 0.27863892912864685,
978
- 0.2827668786048889,
979
- 0.28322896361351013,
980
- 0.29026034474372864,
981
- 0.296204149723053,
982
- 0.2996149957180023,
983
- 0.3005698323249817,
984
- 0.30707406997680664,
985
- 0.3101491630077362,
986
- 0.3167986273765564,
987
- 0.3269317150115967,
988
- 0.32879483699798584,
989
- 0.33054113388061523,
990
- 0.33136507868766785,
991
- 0.3334370255470276,
992
- 0.3420204818248749,
993
- 0.34395188093185425,
994
- 0.3462192118167877,
995
- 0.350506067276001,
996
- 0.3514798581600189,
997
- 0.35246649384498596,
998
- 0.3512493073940277,
999
- 0.3530470132827759,
1000
- 0.355428546667099,
1001
- 0.359707772731781,
1002
- 0.3637158274650574,
1003
- 0.3649544417858124,
1004
- 0.3662114441394806,
1005
- 0.3675302267074585,
1006
- 0.37116730213165283,
1007
- 0.37062546610832214,
1008
- 0.37135010957717896,
1009
- 0.3697737455368042,
1010
- 0.3697727620601654,
1011
- 0.3714151084423065,
1012
- 0.37123236060142517,
1013
- 0.3738124966621399,
1014
- 0.3752833604812622,
1015
- 0.37488511204719543,
1016
- 0.3777393102645874,
1017
- 0.37878528237342834,
1018
- 0.3812442421913147,
1019
- 0.38351762294769287,
1020
- 0.38525545597076416,
1021
- 0.3856000006198883,
1022
- 0.3862100839614868,
1023
- 0.3856704533100128,
1024
- 0.38774314522743225,
1025
- 0.38804271817207336,
1026
- 0.3885641396045685,
1027
- 0.38839849829673767,
1028
- 0.3905911147594452,
1029
- 0.39113733172416687,
1030
- 0.39186158776283264,
1031
- 0.39222121238708496,
1032
- 0.39306116104125977,
1033
- 0.3945384621620178,
1034
- 0.39511334896087646,
1035
- 0.39469024538993835,
1036
- 0.39563339948654175,
1037
- 0.39637646079063416,
1038
- 0.3954394459724426,
1039
- 0.39604392647743225,
1040
- 0.3968430161476135,
1041
- 0.3972108066082001,
1042
- 0.39802664518356323,
1043
- 0.4002288281917572,
1044
- 0.4006965458393097,
1045
- 0.40092286467552185,
1046
- 0.4012592136859894,
1047
- 0.4014245271682739,
1048
- 0.4025733470916748,
1049
- 0.4031515419483185,
1050
- 0.4036944806575775,
1051
- 0.40446820855140686,
1052
- 0.40457797050476074,
1053
- 0.4052768647670746,
1054
- 0.4059322774410248,
1055
- 0.4069337546825409,
1056
- 0.4073435664176941,
1057
- 0.40719661116600037,
1058
- 0.40762969851493835,
1059
- 0.40837234258651733,
1060
- 0.40862128138542175,
1061
- 0.4101361334323883,
1062
- 0.41058194637298584,
1063
- 0.4111683964729309,
1064
- 0.4115133285522461,
1065
- 0.41178953647613525,
1066
- 0.41227221488952637
1067
  ],
1068
  "lr": [
1069
- 7.840000000000001e-05,
1070
- 8e-05,
1071
- 8e-05,
1072
- 8e-05,
1073
- 8e-05,
1074
- 8e-05,
1075
- 8e-05,
1076
- 8e-05,
1077
- 8e-05,
1078
- 8e-05,
1079
- 8e-05,
1080
- 8e-05,
1081
- 8e-05,
1082
- 8e-05,
1083
- 8e-05,
1084
- 8e-05,
1085
- 8e-05,
1086
- 8e-05,
1087
- 8e-05,
1088
- 8e-05,
1089
- 8e-05,
1090
- 8e-05,
1091
- 8e-05,
1092
- 8e-05,
1093
- 8e-05,
1094
- 8e-05,
1095
- 8e-05,
1096
- 8e-05,
1097
- 8e-05,
1098
- 8e-05,
1099
- 8e-05,
1100
- 8e-05,
1101
- 8e-05,
1102
- 8e-05,
1103
- 8e-05,
1104
- 8e-05,
1105
- 8e-05,
1106
- 8e-05,
1107
- 8e-05,
1108
- 8e-05,
1109
- 8e-05,
1110
- 8e-05,
1111
- 8e-05,
1112
- 8e-05,
1113
- 8e-05,
1114
- 8e-05,
1115
- 8e-05,
1116
- 8e-05,
1117
- 8e-05,
1118
- 8e-05,
1119
- 8e-05,
1120
- 8e-05,
1121
- 8e-05,
1122
- 8e-05,
1123
- 8e-05,
1124
- 8e-05,
1125
- 8e-05,
1126
- 8e-05,
1127
- 8e-05,
1128
- 8e-05,
1129
- 8e-05,
1130
- 8e-05,
1131
- 8e-05,
1132
- 8e-05,
1133
- 8e-05,
1134
- 8e-05,
1135
- 8e-05,
1136
- 8e-05,
1137
- 8e-05,
1138
- 8e-05,
1139
- 8e-05,
1140
- 8e-05,
1141
- 8e-05,
1142
- 8e-05,
1143
- 8e-05,
1144
- 8e-05,
1145
- 8e-05,
1146
- 8e-05,
1147
- 8e-05,
1148
- 8e-05,
1149
- 8e-05,
1150
- 8e-05,
1151
- 8e-05,
1152
- 8e-05,
1153
- 8e-05,
1154
- 8e-05,
1155
- 8e-05,
1156
- 8e-05,
1157
- 8e-05,
1158
- 8e-05,
1159
- 7.932818532818534e-05,
1160
- 7.816988416988418e-05,
1161
- 7.701158301158302e-05,
1162
- 7.585328185328185e-05,
1163
- 7.469498069498071e-05,
1164
- 7.353667953667954e-05,
1165
- 7.237837837837838e-05,
1166
- 7.122007722007721e-05,
1167
- 7.006177606177606e-05,
1168
- 6.890347490347492e-05,
1169
- 6.774517374517375e-05,
1170
- 6.65868725868726e-05,
1171
- 6.542857142857144e-05,
1172
- 6.427027027027027e-05,
1173
- 6.311196911196911e-05,
1174
- 6.121235521235521e-05,
1175
- 6.0054054054054064e-05,
1176
- 5.8895752895752895e-05,
1177
- 5.773745173745175e-05,
1178
- 5.6579150579150584e-05,
1179
- 5.542084942084943e-05,
1180
- 5.426254826254825e-05,
1181
- 5.310424710424711e-05,
1182
- 5.194594594594594e-05,
1183
- 5.0787644787644786e-05,
1184
- 4.9629343629343644e-05,
1185
- 4.8471042471042475e-05,
1186
- 4.7312741312741326e-05,
1187
- 4.615444015444014e-05,
1188
- 4.4996138996139e-05,
1189
- 4.309652509652511e-05,
1190
- 4.1938223938223946e-05,
1191
- 4.07799227799228e-05,
1192
- 3.962162162162162e-05,
1193
- 3.846332046332047e-05,
1194
- 3.73050193050193e-05,
1195
- 3.6146718146718155e-05,
1196
- 3.4988416988416986e-05,
1197
- 3.383011583011584e-05,
1198
- 3.267181467181467e-05,
1199
- 3.151351351351352e-05,
1200
- 3.0355212355212367e-05,
1201
- 2.9196911196911198e-05,
1202
- 2.8038610038610046e-05,
1203
- 2.6880308880308876e-05,
1204
- 2.4980694980694983e-05,
1205
- 2.3822393822393838e-05,
1206
- 2.266409266409267e-05,
1207
- 2.1505791505791517e-05,
1208
- 2.0347490347490348e-05,
1209
- 1.9189189189189195e-05,
1210
- 1.8030888030888026e-05,
1211
- 1.6872586872586878e-05,
1212
- 1.571428571428571e-05,
1213
- 1.455598455598456e-05,
1214
- 1.3397683397683389e-05,
1215
- 1.223938223938224e-05,
1216
- 1.1081081081081092e-05,
1217
- 9.92277992277992e-06,
1218
- 8.764478764478772e-06
1219
  ],
1220
  "emb_lr": [],
1221
  "eval_step": [
@@ -1231,520 +1231,520 @@
1231
  7788
1232
  ],
1233
  "eval_accuracy": [
1234
- 0.03,
1235
- 0.92,
 
 
 
1236
  0.95,
1237
  0.99,
1238
  1.0,
1239
- 1.0,
1240
- 1.0,
1241
- 1.0,
1242
- 1.0,
1243
  1.0
1244
  ]
1245
  },
1246
- "final_accuracy": 1.0,
1247
  "sft_eval": {
1248
  "config": {
1249
  "ops": "add_sub",
1250
  "K": null,
1251
  "mode": "sft",
1252
  "n_digits": 6,
1253
- "n_per_split": 50
1254
  },
1255
  "splits": {
1256
  "add_S0": {
1257
- "full_accuracy": 0.66,
1258
- "n_examples": 50,
1259
  "per_subtask": {
1260
  "SA": {
1261
- "accuracy": 0.9457627118644067,
1262
- "count": 295
1263
  },
1264
  "SS": {
1265
- "accuracy": 0.9272727272727272,
1266
- "count": 55
1267
  }
1268
  }
1269
  },
1270
  "add_S1": {
1271
- "full_accuracy": 0.78,
1272
- "n_examples": 50,
1273
  "per_subtask": {
1274
  "SA": {
1275
- "accuracy": 0.9761904761904762,
1276
- "count": 126
1277
  },
1278
  "SC": {
1279
- "accuracy": 0.9367088607594937,
1280
- "count": 79
1281
  },
1282
  "SS": {
1283
  "accuracy": 1.0,
1284
- "count": 21
1285
  },
1286
  "UC": {
1287
- "accuracy": 0.9758064516129032,
1288
- "count": 124
1289
  }
1290
  }
1291
  },
1292
  "add_S2": {
1293
- "full_accuracy": 0.42,
1294
- "n_examples": 50,
1295
  "per_subtask": {
1296
  "SA": {
1297
- "accuracy": 0.92,
1298
- "count": 75
1299
  },
1300
  "SC": {
1301
- "accuracy": 0.9193548387096774,
1302
- "count": 62
1303
  },
1304
  "SS": {
1305
- "accuracy": 0.8205128205128205,
1306
- "count": 39
1307
  },
1308
  "UC": {
1309
- "accuracy": 0.8378378378378378,
1310
- "count": 111
1311
  },
1312
  "US": {
1313
- "accuracy": 0.9047619047619048,
1314
- "count": 63
1315
  }
1316
  }
1317
  },
1318
  "add_S3": {
1319
- "full_accuracy": 0.34,
1320
- "n_examples": 50,
1321
  "per_subtask": {
1322
  "SA": {
1323
- "accuracy": 0.95,
1324
- "count": 60
1325
  },
1326
  "SC": {
1327
- "accuracy": 0.8947368421052632,
1328
- "count": 57
1329
  },
1330
  "SS": {
1331
  "accuracy": 1.0,
1332
- "count": 19
1333
  },
1334
  "UC": {
1335
- "accuracy": 0.7884615384615384,
1336
- "count": 104
1337
  },
1338
  "US": {
1339
- "accuracy": 0.8545454545454545,
1340
- "count": 110
1341
  }
1342
  }
1343
  },
1344
  "add_S4": {
1345
- "full_accuracy": 0.36,
1346
- "n_examples": 50,
1347
  "per_subtask": {
1348
  "SA": {
1349
  "accuracy": 1.0,
1350
- "count": 48
1351
  },
1352
  "SC": {
1353
- "accuracy": 0.9807692307692307,
1354
- "count": 52
1355
  },
1356
  "SS": {
1357
- "accuracy": 0.8571428571428571,
1358
- "count": 7
1359
  },
1360
  "UC": {
1361
- "accuracy": 0.7303370786516854,
1362
- "count": 89
1363
  },
1364
  "US": {
1365
- "accuracy": 0.6688311688311688,
1366
- "count": 154
1367
  }
1368
  }
1369
  },
1370
  "add_S5": {
1371
- "full_accuracy": 0.18,
1372
- "n_examples": 50,
1373
  "per_subtask": {
1374
  "SA": {
1375
  "accuracy": 1.0,
1376
- "count": 50
1377
  },
1378
  "SC": {
1379
- "accuracy": 0.98,
1380
- "count": 50
1381
  },
1382
  "UC": {
1383
- "accuracy": 0.44,
1384
- "count": 50
1385
  },
1386
  "US": {
1387
- "accuracy": 0.375,
1388
- "count": 200
1389
  }
1390
  }
1391
  },
1392
  "add_S6": {
1393
- "full_accuracy": 0.3,
1394
- "n_examples": 50,
1395
  "per_subtask": {
1396
  "SC": {
1397
  "accuracy": 1.0,
1398
- "count": 50
1399
  },
1400
  "UC": {
1401
- "accuracy": 0.34,
1402
- "count": 50
1403
  },
1404
  "US": {
1405
- "accuracy": 0.452,
1406
- "count": 250
1407
  }
1408
  }
1409
  },
1410
  "add_random": {
1411
- "full_accuracy": 0.795,
1412
  "n_examples": 200,
1413
  "per_subtask": {
1414
  "SA": {
1415
- "accuracy": 0.9791183294663574,
1416
- "count": 431
1417
  },
1418
  "SC": {
1419
- "accuracy": 0.9778481012658228,
1420
- "count": 316
1421
  },
1422
  "SS": {
1423
- "accuracy": 0.8717948717948718,
1424
- "count": 39
1425
  },
1426
  "UC": {
1427
- "accuracy": 0.95,
1428
- "count": 560
1429
  },
1430
  "US": {
1431
- "accuracy": 0.9259259259259259,
1432
- "count": 54
1433
  }
1434
  }
1435
  },
1436
  "add_C3": {
1437
- "full_accuracy": 0.58,
1438
- "n_examples": 50,
1439
  "per_subtask": {
1440
  "SA": {
1441
  "accuracy": 1.0,
1442
- "count": 150
1443
  },
1444
  "SC": {
1445
  "accuracy": 1.0,
1446
- "count": 50
1447
  },
1448
  "UC": {
1449
- "accuracy": 0.8365384615384616,
1450
- "count": 104
1451
  },
1452
  "US": {
1453
- "accuracy": 0.8260869565217391,
1454
- "count": 46
1455
  }
1456
  }
1457
  },
1458
  "add_C4": {
1459
- "full_accuracy": 0.42,
1460
- "n_examples": 50,
1461
  "per_subtask": {
1462
  "SA": {
1463
- "accuracy": 0.99,
1464
- "count": 100
1465
  },
1466
  "SC": {
1467
  "accuracy": 1.0,
1468
- "count": 50
1469
  },
1470
  "UC": {
1471
- "accuracy": 0.8130081300813008,
1472
- "count": 123
1473
  },
1474
  "US": {
1475
- "accuracy": 0.6883116883116883,
1476
- "count": 77
1477
  }
1478
  }
1479
  },
1480
  "add_C5": {
1481
- "full_accuracy": 0.32,
1482
- "n_examples": 50,
1483
  "per_subtask": {
1484
  "SA": {
1485
  "accuracy": 1.0,
1486
- "count": 50
1487
  },
1488
  "SC": {
1489
- "accuracy": 0.98,
1490
- "count": 50
1491
  },
1492
  "UC": {
1493
- "accuracy": 0.7792207792207793,
1494
- "count": 154
1495
  },
1496
  "US": {
1497
- "accuracy": 0.8541666666666666,
1498
- "count": 96
1499
  }
1500
  }
1501
  },
1502
  "add_C6": {
1503
- "full_accuracy": 0.28,
1504
- "n_examples": 50,
1505
  "per_subtask": {
1506
  "SC": {
1507
  "accuracy": 1.0,
1508
- "count": 50
1509
  },
1510
  "UC": {
1511
- "accuracy": 0.7692307692307693,
1512
- "count": 182
1513
  },
1514
  "US": {
1515
- "accuracy": 0.7711864406779662,
1516
- "count": 118
1517
  }
1518
  }
1519
  },
1520
  "sub_M0": {
1521
- "full_accuracy": 0.64,
1522
- "n_examples": 50,
1523
  "per_subtask": {
1524
  "MD": {
1525
- "accuracy": 0.935374149659864,
1526
- "count": 294
1527
  },
1528
  "ME": {
1529
  "accuracy": 1.0,
1530
- "count": 56
1531
  }
1532
  }
1533
  },
1534
  "sub_M1": {
1535
- "full_accuracy": 0.84,
1536
- "n_examples": 50,
1537
  "per_subtask": {
1538
  "MD": {
1539
- "accuracy": 0.958041958041958,
1540
- "count": 143
1541
  },
1542
  "MB": {
1543
- "accuracy": 1.0,
1544
- "count": 69
1545
  },
1546
  "ME": {
1547
  "accuracy": 1.0,
1548
- "count": 15
1549
  },
1550
  "UB": {
1551
- "accuracy": 0.975609756097561,
1552
- "count": 123
1553
  }
1554
  }
1555
  },
1556
  "sub_M2": {
1557
- "full_accuracy": 0.36,
1558
- "n_examples": 50,
1559
  "per_subtask": {
1560
  "MD": {
1561
- "accuracy": 0.9351851851851852,
1562
- "count": 108
1563
  },
1564
  "MB": {
1565
  "accuracy": 1.0,
1566
- "count": 52
1567
  },
1568
  "ME": {
1569
- "accuracy": 0.9615384615384616,
1570
- "count": 52
1571
  },
1572
  "UB": {
1573
- "accuracy": 0.6551724137931034,
1574
- "count": 87
1575
  },
1576
  "UD": {
1577
  "accuracy": 1.0,
1578
- "count": 51
1579
  }
1580
  }
1581
  },
1582
  "sub_M3": {
1583
- "full_accuracy": 0.12,
1584
- "n_examples": 50,
1585
  "per_subtask": {
1586
  "MD": {
1587
- "accuracy": 0.9893617021276596,
1588
- "count": 94
1589
  },
1590
  "MB": {
1591
- "accuracy": 0.9803921568627451,
1592
- "count": 51
1593
  },
1594
  "ME": {
1595
  "accuracy": 1.0,
1596
- "count": 25
1597
  },
1598
  "UB": {
1599
- "accuracy": 0.6410256410256411,
1600
- "count": 78
1601
  },
1602
  "UD": {
1603
- "accuracy": 0.6078431372549019,
1604
- "count": 102
1605
  }
1606
  }
1607
  },
1608
  "sub_M4": {
1609
- "full_accuracy": 0.06,
1610
- "n_examples": 50,
1611
  "per_subtask": {
1612
  "MD": {
1613
- "accuracy": 0.99,
1614
- "count": 100
1615
  },
1616
  "MB": {
1617
  "accuracy": 1.0,
1618
- "count": 50
1619
  },
1620
  "UB": {
1621
- "accuracy": 0.66,
1622
- "count": 50
1623
  },
1624
  "UD": {
1625
- "accuracy": 0.34,
1626
- "count": 150
1627
  }
1628
  }
1629
  },
1630
  "sub_M5": {
1631
- "full_accuracy": 0.2,
1632
- "n_examples": 50,
1633
  "per_subtask": {
1634
  "MD": {
1635
  "accuracy": 1.0,
1636
- "count": 50
1637
  },
1638
  "MB": {
1639
  "accuracy": 1.0,
1640
- "count": 50
1641
  },
1642
  "UB": {
1643
- "accuracy": 0.82,
1644
- "count": 50
1645
  },
1646
  "UD": {
1647
- "accuracy": 0.38,
1648
- "count": 200
1649
  }
1650
  }
1651
  },
1652
  "sub_random": {
1653
- "full_accuracy": 0.775,
1654
  "n_examples": 200,
1655
  "per_subtask": {
1656
  "MD": {
1657
- "accuracy": 0.9693877551020408,
1658
- "count": 588
1659
  },
1660
  "MB": {
1661
- "accuracy": 0.9925373134328358,
1662
- "count": 268
1663
  },
1664
  "ME": {
1665
  "accuracy": 1.0,
1666
- "count": 60
1667
  },
1668
  "UB": {
1669
- "accuracy": 0.9328859060402684,
1670
- "count": 447
1671
  },
1672
  "UD": {
1673
- "accuracy": 0.8918918918918919,
1674
- "count": 37
1675
  }
1676
  }
1677
  },
1678
  "sub_B3": {
1679
- "full_accuracy": 0.56,
1680
- "n_examples": 50,
1681
  "per_subtask": {
1682
  "MD": {
1683
- "accuracy": 0.9933333333333333,
1684
- "count": 150
1685
  },
1686
  "MB": {
1687
  "accuracy": 1.0,
1688
- "count": 50
1689
  },
1690
  "UB": {
1691
- "accuracy": 0.8317757009345794,
1692
- "count": 107
1693
  },
1694
  "UD": {
1695
- "accuracy": 0.8372093023255814,
1696
- "count": 43
1697
  }
1698
  }
1699
  },
1700
  "sub_B4": {
1701
- "full_accuracy": 0.34,
1702
- "n_examples": 50,
1703
  "per_subtask": {
1704
  "MD": {
1705
  "accuracy": 1.0,
1706
- "count": 100
1707
  },
1708
  "MB": {
1709
  "accuracy": 1.0,
1710
- "count": 50
1711
  },
1712
  "UB": {
1713
- "accuracy": 0.8157894736842105,
1714
- "count": 114
1715
  },
1716
  "UD": {
1717
- "accuracy": 0.6046511627906976,
1718
- "count": 86
1719
  }
1720
  }
1721
  },
1722
  "sub_B5": {
1723
- "full_accuracy": 0.28,
1724
- "n_examples": 50,
1725
  "per_subtask": {
1726
  "MD": {
1727
  "accuracy": 1.0,
1728
- "count": 50
1729
  },
1730
  "MB": {
1731
  "accuracy": 1.0,
1732
- "count": 50
1733
  },
1734
  "UB": {
1735
- "accuracy": 0.7843137254901961,
1736
- "count": 153
1737
  },
1738
  "UD": {
1739
- "accuracy": 0.6597938144329897,
1740
- "count": 97
1741
  }
1742
  }
1743
  }
1744
  },
1745
  "summary": {
1746
- "overall_accuracy": 0.5107142857142857,
1747
- "total_examples": 1400,
1748
  "n_splits": 22
1749
  }
1750
  },
@@ -1754,160 +1754,160 @@
1754
  "K": 4,
1755
  "mode": "sorl",
1756
  "n_digits": 6,
1757
- "n_per_split": 50
1758
  },
1759
  "splits": {
1760
  "add_S0": {
1761
  "full_accuracy": 1.0,
1762
- "n_examples": 50,
1763
  "per_subtask": {
1764
  "SA": {
1765
  "accuracy": 1.0,
1766
- "count": 295
1767
  },
1768
  "SS": {
1769
  "accuracy": 1.0,
1770
- "count": 55
1771
  }
1772
  }
1773
  },
1774
  "add_S1": {
1775
  "full_accuracy": 1.0,
1776
- "n_examples": 50,
1777
  "per_subtask": {
1778
  "SA": {
1779
  "accuracy": 1.0,
1780
- "count": 126
1781
  },
1782
  "SC": {
1783
  "accuracy": 1.0,
1784
- "count": 79
1785
  },
1786
  "SS": {
1787
  "accuracy": 1.0,
1788
- "count": 21
1789
  },
1790
  "UC": {
1791
  "accuracy": 1.0,
1792
- "count": 124
1793
  }
1794
  }
1795
  },
1796
  "add_S2": {
1797
  "full_accuracy": 1.0,
1798
- "n_examples": 50,
1799
  "per_subtask": {
1800
  "SA": {
1801
  "accuracy": 1.0,
1802
- "count": 75
1803
  },
1804
  "SC": {
1805
  "accuracy": 1.0,
1806
- "count": 62
1807
  },
1808
  "SS": {
1809
  "accuracy": 1.0,
1810
- "count": 39
1811
  },
1812
  "UC": {
1813
  "accuracy": 1.0,
1814
- "count": 111
1815
  },
1816
  "US": {
1817
  "accuracy": 1.0,
1818
- "count": 63
1819
  }
1820
  }
1821
  },
1822
  "add_S3": {
1823
  "full_accuracy": 1.0,
1824
- "n_examples": 50,
1825
  "per_subtask": {
1826
  "SA": {
1827
  "accuracy": 1.0,
1828
- "count": 60
1829
  },
1830
  "SC": {
1831
  "accuracy": 1.0,
1832
- "count": 57
1833
  },
1834
  "SS": {
1835
  "accuracy": 1.0,
1836
- "count": 19
1837
  },
1838
  "UC": {
1839
  "accuracy": 1.0,
1840
- "count": 104
1841
  },
1842
  "US": {
1843
  "accuracy": 1.0,
1844
- "count": 110
1845
  }
1846
  }
1847
  },
1848
  "add_S4": {
1849
  "full_accuracy": 1.0,
1850
- "n_examples": 50,
1851
  "per_subtask": {
1852
  "SA": {
1853
  "accuracy": 1.0,
1854
- "count": 48
1855
  },
1856
  "SC": {
1857
  "accuracy": 1.0,
1858
- "count": 52
1859
  },
1860
  "SS": {
1861
  "accuracy": 1.0,
1862
- "count": 7
1863
  },
1864
  "UC": {
1865
  "accuracy": 1.0,
1866
- "count": 89
1867
  },
1868
  "US": {
1869
  "accuracy": 1.0,
1870
- "count": 154
1871
  }
1872
  }
1873
  },
1874
  "add_S5": {
1875
- "full_accuracy": 1.0,
1876
- "n_examples": 50,
1877
  "per_subtask": {
1878
  "SA": {
1879
  "accuracy": 1.0,
1880
- "count": 50
1881
  },
1882
  "SC": {
1883
  "accuracy": 1.0,
1884
- "count": 50
1885
  },
1886
  "UC": {
1887
- "accuracy": 1.0,
1888
- "count": 50
1889
  },
1890
  "US": {
1891
  "accuracy": 1.0,
1892
- "count": 200
1893
  }
1894
  }
1895
  },
1896
  "add_S6": {
1897
- "full_accuracy": 1.0,
1898
- "n_examples": 50,
1899
  "per_subtask": {
1900
  "SC": {
1901
  "accuracy": 1.0,
1902
- "count": 50
1903
  },
1904
  "UC": {
1905
- "accuracy": 1.0,
1906
- "count": 50
1907
  },
1908
  "US": {
1909
  "accuracy": 1.0,
1910
- "count": 250
1911
  }
1912
  }
1913
  },
@@ -1917,239 +1917,239 @@
1917
  "per_subtask": {
1918
  "SA": {
1919
  "accuracy": 1.0,
1920
- "count": 431
1921
  },
1922
  "SC": {
1923
  "accuracy": 1.0,
1924
- "count": 316
1925
  },
1926
  "SS": {
1927
  "accuracy": 1.0,
1928
- "count": 39
1929
  },
1930
  "UC": {
1931
  "accuracy": 1.0,
1932
- "count": 560
1933
  },
1934
  "US": {
1935
  "accuracy": 1.0,
1936
- "count": 54
1937
  }
1938
  }
1939
  },
1940
  "add_C3": {
1941
  "full_accuracy": 1.0,
1942
- "n_examples": 50,
1943
  "per_subtask": {
1944
  "SA": {
1945
  "accuracy": 1.0,
1946
- "count": 150
1947
  },
1948
  "SC": {
1949
  "accuracy": 1.0,
1950
- "count": 50
1951
  },
1952
  "UC": {
1953
  "accuracy": 1.0,
1954
- "count": 104
1955
  },
1956
  "US": {
1957
  "accuracy": 1.0,
1958
- "count": 46
1959
  }
1960
  }
1961
  },
1962
  "add_C4": {
1963
  "full_accuracy": 1.0,
1964
- "n_examples": 50,
1965
  "per_subtask": {
1966
  "SA": {
1967
  "accuracy": 1.0,
1968
- "count": 100
1969
  },
1970
  "SC": {
1971
  "accuracy": 1.0,
1972
- "count": 50
1973
  },
1974
  "UC": {
1975
  "accuracy": 1.0,
1976
- "count": 123
1977
  },
1978
  "US": {
1979
  "accuracy": 1.0,
1980
- "count": 77
1981
  }
1982
  }
1983
  },
1984
  "add_C5": {
1985
  "full_accuracy": 1.0,
1986
- "n_examples": 50,
1987
  "per_subtask": {
1988
  "SA": {
1989
  "accuracy": 1.0,
1990
- "count": 50
1991
  },
1992
  "SC": {
1993
  "accuracy": 1.0,
1994
- "count": 50
1995
  },
1996
  "UC": {
1997
  "accuracy": 1.0,
1998
- "count": 154
1999
  },
2000
  "US": {
2001
  "accuracy": 1.0,
2002
- "count": 96
2003
  }
2004
  }
2005
  },
2006
  "add_C6": {
2007
  "full_accuracy": 1.0,
2008
- "n_examples": 50,
2009
  "per_subtask": {
2010
  "SC": {
2011
  "accuracy": 1.0,
2012
- "count": 50
2013
  },
2014
  "UC": {
2015
  "accuracy": 1.0,
2016
- "count": 182
2017
  },
2018
  "US": {
2019
  "accuracy": 1.0,
2020
- "count": 118
2021
  }
2022
  }
2023
  },
2024
  "sub_M0": {
2025
  "full_accuracy": 1.0,
2026
- "n_examples": 50,
2027
  "per_subtask": {
2028
  "MD": {
2029
  "accuracy": 1.0,
2030
- "count": 294
2031
  },
2032
  "ME": {
2033
  "accuracy": 1.0,
2034
- "count": 56
2035
  }
2036
  }
2037
  },
2038
  "sub_M1": {
2039
  "full_accuracy": 1.0,
2040
- "n_examples": 50,
2041
  "per_subtask": {
2042
  "MD": {
2043
  "accuracy": 1.0,
2044
- "count": 143
2045
  },
2046
  "MB": {
2047
  "accuracy": 1.0,
2048
- "count": 69
2049
  },
2050
  "ME": {
2051
  "accuracy": 1.0,
2052
- "count": 15
2053
  },
2054
  "UB": {
2055
  "accuracy": 1.0,
2056
- "count": 123
2057
  }
2058
  }
2059
  },
2060
  "sub_M2": {
2061
  "full_accuracy": 1.0,
2062
- "n_examples": 50,
2063
  "per_subtask": {
2064
  "MD": {
2065
  "accuracy": 1.0,
2066
- "count": 108
2067
  },
2068
  "MB": {
2069
  "accuracy": 1.0,
2070
- "count": 52
2071
  },
2072
  "ME": {
2073
  "accuracy": 1.0,
2074
- "count": 52
2075
  },
2076
  "UB": {
2077
  "accuracy": 1.0,
2078
- "count": 87
2079
  },
2080
  "UD": {
2081
  "accuracy": 1.0,
2082
- "count": 51
2083
  }
2084
  }
2085
  },
2086
  "sub_M3": {
2087
  "full_accuracy": 1.0,
2088
- "n_examples": 50,
2089
  "per_subtask": {
2090
  "MD": {
2091
  "accuracy": 1.0,
2092
- "count": 94
2093
  },
2094
  "MB": {
2095
  "accuracy": 1.0,
2096
- "count": 51
2097
  },
2098
  "ME": {
2099
  "accuracy": 1.0,
2100
- "count": 25
2101
  },
2102
  "UB": {
2103
  "accuracy": 1.0,
2104
- "count": 78
2105
  },
2106
  "UD": {
2107
  "accuracy": 1.0,
2108
- "count": 102
2109
  }
2110
  }
2111
  },
2112
  "sub_M4": {
2113
- "full_accuracy": 1.0,
2114
- "n_examples": 50,
2115
  "per_subtask": {
2116
  "MD": {
2117
  "accuracy": 1.0,
2118
- "count": 100
2119
  },
2120
  "MB": {
2121
  "accuracy": 1.0,
2122
- "count": 50
2123
  },
2124
  "UB": {
2125
- "accuracy": 1.0,
2126
- "count": 50
2127
  },
2128
  "UD": {
2129
  "accuracy": 1.0,
2130
- "count": 150
2131
  }
2132
  }
2133
  },
2134
  "sub_M5": {
2135
- "full_accuracy": 1.0,
2136
- "n_examples": 50,
2137
  "per_subtask": {
2138
  "MD": {
2139
  "accuracy": 1.0,
2140
- "count": 50
2141
  },
2142
  "MB": {
2143
  "accuracy": 1.0,
2144
- "count": 50
2145
  },
2146
  "UB": {
2147
- "accuracy": 1.0,
2148
- "count": 50
2149
  },
2150
  "UD": {
2151
  "accuracy": 1.0,
2152
- "count": 200
2153
  }
2154
  }
2155
  },
@@ -2159,99 +2159,99 @@
2159
  "per_subtask": {
2160
  "MD": {
2161
  "accuracy": 1.0,
2162
- "count": 588
2163
  },
2164
  "MB": {
2165
  "accuracy": 1.0,
2166
- "count": 268
2167
  },
2168
  "ME": {
2169
  "accuracy": 1.0,
2170
- "count": 60
2171
  },
2172
  "UB": {
2173
  "accuracy": 1.0,
2174
- "count": 447
2175
  },
2176
  "UD": {
2177
  "accuracy": 1.0,
2178
- "count": 37
2179
  }
2180
  }
2181
  },
2182
  "sub_B3": {
2183
  "full_accuracy": 1.0,
2184
- "n_examples": 50,
2185
  "per_subtask": {
2186
  "MD": {
2187
  "accuracy": 1.0,
2188
- "count": 150
2189
  },
2190
  "MB": {
2191
  "accuracy": 1.0,
2192
- "count": 50
2193
  },
2194
  "UB": {
2195
  "accuracy": 1.0,
2196
- "count": 107
2197
  },
2198
  "UD": {
2199
  "accuracy": 1.0,
2200
- "count": 43
2201
  }
2202
  }
2203
  },
2204
  "sub_B4": {
2205
  "full_accuracy": 1.0,
2206
- "n_examples": 50,
2207
  "per_subtask": {
2208
  "MD": {
2209
  "accuracy": 1.0,
2210
- "count": 100
2211
  },
2212
  "MB": {
2213
  "accuracy": 1.0,
2214
- "count": 50
2215
  },
2216
  "UB": {
2217
  "accuracy": 1.0,
2218
- "count": 114
2219
  },
2220
  "UD": {
2221
  "accuracy": 1.0,
2222
- "count": 86
2223
  }
2224
  }
2225
  },
2226
  "sub_B5": {
2227
  "full_accuracy": 1.0,
2228
- "n_examples": 50,
2229
  "per_subtask": {
2230
  "MD": {
2231
  "accuracy": 1.0,
2232
- "count": 50
2233
  },
2234
  "MB": {
2235
  "accuracy": 1.0,
2236
- "count": 50
2237
  },
2238
  "UB": {
2239
  "accuracy": 1.0,
2240
- "count": 153
2241
  },
2242
  "UD": {
2243
  "accuracy": 1.0,
2244
- "count": 97
2245
  }
2246
  }
2247
  }
2248
  },
2249
  "summary": {
2250
- "overall_accuracy": 1.0,
2251
- "total_examples": 1400,
2252
  "n_splits": 22
2253
  }
2254
  },
2255
- "sorl_overall_accuracy": 1.0,
2256
- "sft_overall_accuracy": 0.5107142857142857
2257
  }
 
153
  7788
154
  ],
155
  "loss": [
156
+ 14.632190704345703,
157
+ 9.926382064819336,
158
+ 6.634365081787109,
159
+ 4.12091064453125,
160
+ 2.3600664138793945,
161
+ 2.5965561866760254,
162
+ 2.2668251991271973,
163
+ 2.4945991039276123,
164
+ 1.87929368019104,
165
+ 1.770228624343872,
166
+ 1.4810309410095215,
167
+ 1.115319013595581,
168
+ 1.2603116035461426,
169
+ 1.118563175201416,
170
+ 0.7639645338058472,
171
+ 0.5783902406692505,
172
+ -0.2102416753768921,
173
+ -1.0637309551239014,
174
+ -2.982658863067627,
175
+ -5.1272735595703125,
176
+ -6.820440769195557,
177
+ -8.708982467651367,
178
+ -9.34764575958252,
179
+ -9.479778289794922,
180
+ -9.714715003967285,
181
+ -9.847146987915039,
182
+ -10.891656875610352,
183
+ -10.567233085632324,
184
+ -10.487039566040039,
185
+ -10.561330795288086,
186
+ -11.278342247009277,
187
+ -11.53654956817627,
188
+ -11.39672565460205,
189
+ -12.42699146270752,
190
+ -12.283132553100586,
191
+ -12.111838340759277,
192
+ -12.558882713317871,
193
+ -12.664121627807617,
194
+ -11.877008438110352,
195
+ -13.080121040344238,
196
+ -12.89445972442627,
197
+ -13.657825469970703,
198
+ -13.041352272033691,
199
+ -12.739060401916504,
200
+ -13.011455535888672,
201
+ -13.518850326538086,
202
+ -13.68348217010498,
203
+ -13.794760704040527,
204
+ -12.652961730957031,
205
+ -13.282352447509766,
206
+ -12.864669799804688,
207
+ -12.425497055053711,
208
+ -13.485628128051758,
209
+ -13.69277286529541,
210
+ -13.639493942260742,
211
+ -13.366686820983887,
212
+ -13.520065307617188,
213
+ -13.455315589904785,
214
+ -13.581616401672363,
215
+ -13.953703880310059,
216
+ -13.787495613098145,
217
+ -13.657554626464844,
218
+ -13.825128555297852,
219
+ -13.480307579040527,
220
+ -12.544189453125,
221
+ -11.929388999938965,
222
+ -10.827520370483398,
223
+ -8.075313568115234,
224
+ -6.391434192657471,
225
+ -5.907987594604492,
226
+ -4.740344047546387,
227
+ -5.025309085845947,
228
+ -4.2770867347717285,
229
+ -4.229391574859619,
230
+ -3.865729570388794,
231
+ -4.085846424102783,
232
+ -3.6969783306121826,
233
+ -3.788874387741089,
234
+ -3.3547849655151367,
235
+ -3.1135661602020264,
236
+ -2.8369789123535156,
237
+ -2.6105422973632812,
238
+ -3.406431198120117,
239
+ -2.858949661254883,
240
+ -2.1879334449768066,
241
+ -2.340407133102417,
242
+ -1.6988248825073242,
243
+ -1.7582203149795532,
244
+ -2.0069541931152344,
245
+ -2.3115696907043457,
246
+ -1.6048082113265991,
247
+ -3.4057414531707764,
248
+ -1.5541704893112183,
249
+ -1.587241768836975,
250
+ -1.341800570487976,
251
+ -1.3259270191192627,
252
+ -1.2093465328216553,
253
+ -1.1008269786834717,
254
+ -0.8763017654418945,
255
+ -1.4300707578659058,
256
+ -1.191908597946167,
257
+ -1.174930453300476,
258
+ -1.2244458198547363,
259
+ -0.4350616931915283,
260
+ -1.2295445203781128,
261
+ -0.4361853301525116,
262
+ -0.5482154488563538,
263
+ -1.4029738903045654,
264
+ -0.9040775895118713,
265
+ -0.5001223087310791,
266
+ -0.3795071244239807,
267
+ -0.7955602407455444,
268
+ -0.8618952631950378,
269
+ -0.6030458807945251,
270
+ -0.8650072813034058,
271
+ -0.632997989654541,
272
+ -0.8306871652603149,
273
+ -0.6155402660369873,
274
+ -0.47851070761680603,
275
+ -0.4381093382835388,
276
+ -0.7446098327636719,
277
+ -0.604732871055603,
278
+ -0.586620569229126,
279
+ -0.5812572240829468,
280
+ -0.5657588839530945,
281
+ -0.40892261266708374,
282
+ -0.34598445892333984,
283
+ -0.37908679246902466,
284
+ -0.6343741416931152,
285
+ -0.48928260803222656,
286
+ -0.4414480924606323,
287
+ -0.5256525874137878,
288
+ -0.5549529790878296,
289
+ -0.5228503942489624,
290
+ -0.43323570489883423,
291
+ -0.35606762766838074,
292
+ -0.3718273639678955,
293
+ -0.3244103789329529,
294
+ -0.31916630268096924,
295
+ -0.36536484956741333,
296
+ -0.5733921527862549,
297
+ -0.36300128698349,
298
+ -0.16675259172916412,
299
+ -0.3644050359725952,
300
+ -0.3043482303619385,
301
+ -0.24840393662452698,
302
+ -0.19103999435901642,
303
+ -0.1850191354751587,
304
+ -0.3407224416732788,
305
+ -0.25857996940612793
306
  ],
307
  "base_loss": [
308
+ 9.482434272766113,
309
+ 7.117786884307861,
310
+ 6.046176433563232,
311
+ 4.258971214294434,
312
+ 2.312073230743408,
313
+ 1.998913049697876,
314
+ 1.8657360076904297,
315
+ 1.941304087638855,
316
+ 1.8812999725341797,
317
+ 1.8264588117599487,
318
+ 1.827309250831604,
319
+ 1.793294906616211,
320
+ 1.8274389505386353,
321
+ 1.8220479488372803,
322
+ 1.8286134004592896,
323
+ 1.7788950204849243,
324
+ 1.8032491207122803,
325
+ 1.7887276411056519,
326
+ 2.006676197052002,
327
+ 1.9466220140457153,
328
+ 1.938077688217163,
329
+ 2.0098798274993896,
330
+ 1.9562937021255493,
331
+ 1.7426707744598389,
332
+ 1.8475419282913208,
333
+ 1.8222671747207642,
334
+ 1.7838033437728882,
335
+ 1.7463515996932983,
336
+ 1.697568655014038,
337
+ 1.7143851518630981,
338
+ 1.7419077157974243,
339
+ 1.7188345193862915,
340
+ 1.658122181892395,
341
+ 1.7801390886306763,
342
+ 1.6910394430160522,
343
+ 1.6635606288909912,
344
+ 1.7399853467941284,
345
+ 1.6727386713027954,
346
+ 1.5781800746917725,
347
+ 1.6815193891525269,
348
+ 1.6525733470916748,
349
+ 1.708761215209961,
350
+ 1.6608943939208984,
351
+ 1.6103297472000122,
352
+ 1.623249888420105,
353
+ 1.6843823194503784,
354
+ 1.7061597108840942,
355
+ 1.6853832006454468,
356
+ 1.5944339036941528,
357
+ 1.6551153659820557,
358
+ 1.5582751035690308,
359
+ 1.5246549844741821,
360
+ 1.6163057088851929,
361
+ 1.616803526878357,
362
+ 1.6256102323532104,
363
+ 1.5938681364059448,
364
+ 1.6049398183822632,
365
+ 1.5970059633255005,
366
+ 1.624014973640442,
367
+ 1.625469446182251,
368
+ 1.5937610864639282,
369
+ 1.5731550455093384,
370
+ 1.5809533596038818,
371
+ 1.5393472909927368,
372
+ 1.435717225074768,
373
+ 1.369104266166687,
374
+ 1.2582679986953735,
375
+ 0.9665323495864868,
376
+ 0.7821284532546997,
377
+ 0.7074981331825256,
378
+ 0.5917485356330872,
379
+ 0.6081733107566833,
380
+ 0.5498444437980652,
381
+ 0.5120163559913635,
382
+ 0.4534907341003418,
383
+ 0.4987371265888214,
384
+ 0.4344933032989502,
385
+ 0.4616098999977112,
386
+ 0.3905290961265564,
387
+ 0.36903122067451477,
388
+ 0.3468772768974304,
389
+ 0.3053329885005951,
390
+ 0.39532873034477234,
391
+ 0.33305686712265015,
392
+ 0.2736288011074066,
393
+ 0.27657410502433777,
394
+ 0.21591803431510925,
395
+ 0.20601941645145416,
396
+ 0.23737052083015442,
397
+ 0.27516016364097595,
398
+ 0.20490236580371857,
399
+ 0.4041613042354584,
400
+ 0.1861131340265274,
401
+ 0.19129757583141327,
402
+ 0.1886499673128128,
403
+ 0.18159404397010803,
404
+ 0.14922840893268585,
405
+ 0.13664014637470245,
406
+ 0.10598627477884293,
407
+ 0.1828942596912384,
408
+ 0.1439986377954483,
409
+ 0.14368221163749695,
410
+ 0.14707587659358978,
411
+ 0.07975024729967117,
412
+ 0.14613859355449677,
413
+ 0.06020959094166756,
414
+ 0.07016318291425705,
415
+ 0.1634124517440796,
416
+ 0.1087348610162735,
417
+ 0.082696333527565,
418
+ 0.07368756830692291,
419
+ 0.10071809589862823,
420
+ 0.10751090198755264,
421
+ 0.07716800272464752,
422
+ 0.10648422688245773,
423
+ 0.07751994580030441,
424
+ 0.09940018504858017,
425
+ 0.07651485502719879,
426
+ 0.05863216146826744,
427
+ 0.05505487695336342,
428
+ 0.09117519855499268,
429
+ 0.07521039247512817,
430
+ 0.07184553146362305,
431
+ 0.07176653295755386,
432
+ 0.0699726790189743,
433
+ 0.052560459822416306,
434
+ 0.044058240950107574,
435
+ 0.048487093299627304,
436
+ 0.08156915754079819,
437
+ 0.061087582260370255,
438
+ 0.06119650602340698,
439
+ 0.06394444406032562,
440
+ 0.07004927843809128,
441
+ 0.0659731775522232,
442
+ 0.05378962680697441,
443
+ 0.0477081723511219,
444
+ 0.04793006181716919,
445
+ 0.04166543111205101,
446
+ 0.04095941409468651,
447
+ 0.04708099737763405,
448
+ 0.07109672576189041,
449
+ 0.045931022614240646,
450
+ 0.024872872978448868,
451
+ 0.04558694362640381,
452
+ 0.03894834965467453,
453
+ 0.03414854779839516,
454
+ 0.027124684303998947,
455
+ 0.027090419083833694,
456
+ 0.044619057327508926,
457
+ 0.033715397119522095
458
  ],
459
  "info_loss": [
460
+ -0.12326622009277344,
461
+ -0.18317556381225586,
462
+ -0.21192121505737305,
463
+ -0.1614665985107422,
464
+ -0.09911632537841797,
465
+ -0.03676164150238037,
466
+ -0.05518639087677002,
467
+ -0.03937363624572754,
468
+ -0.09468269348144531,
469
+ -0.09933149814605713,
470
+ -0.127937912940979,
471
+ -0.1626497507095337,
472
+ -0.15077292919158936,
473
+ -0.16379308700561523,
474
+ -0.19910144805908203,
475
+ -0.20818078517913818,
476
+ -0.2778512239456177,
477
+ -0.351151704788208,
478
+ -0.5528711080551147,
479
+ -0.7527784109115601,
480
+ -0.9174032211303711,
481
+ -1.1097712516784668,
482
+ -1.1687355041503906,
483
+ -1.156583309173584,
484
+ -1.1916966438293457,
485
+ -1.1981340646743774,
486
+ -1.2985475063323975,
487
+ -1.2606419324874878,
488
+ -1.246760606765747,
489
+ -1.2560533285140991,
490
+ -1.331277847290039,
491
+ -1.3520653247833252,
492
+ -1.3316826820373535,
493
+ -1.4475840330123901,
494
+ -1.423694372177124,
495
+ -1.401245355606079,
496
+ -1.4543802738189697,
497
+ -1.456540822982788,
498
+ -1.3692126274108887,
499
+ -1.4987409114837646,
500
+ -1.4760082960128784,
501
+ -1.5583420991897583,
502
+ -1.4900978803634644,
503
+ -1.4563288688659668,
504
+ -1.4812694787979126,
505
+ -1.5390629768371582,
506
+ -1.5584094524383545,
507
+ -1.56727933883667,
508
+ -1.4423127174377441,
509
+ -1.5100535154342651,
510
+ -1.4591412544250488,
511
+ -1.4114735126495361,
512
+ -1.5255085229873657,
513
+ -1.547141432762146,
514
+ -1.54146146774292,
515
+ -1.510321855545044,
516
+ -1.5257158279418945,
517
+ -1.5199824571609497,
518
+ -1.5334408283233643,
519
+ -1.5722233057022095,
520
+ -1.5500802993774414,
521
+ -1.5357627868652344,
522
+ -1.552409052848816,
523
+ -1.5149730443954468,
524
+ -1.40906822681427,
525
+ -1.341101884841919,
526
+ -1.2200331687927246,
527
+ -0.9157827496528625,
528
+ -0.7277940511703491,
529
+ -0.6731217503547668,
530
+ -0.5456058979034424,
531
+ -0.5737265944480896,
532
+ -0.49359437823295593,
533
+ -0.48544979095458984,
534
+ -0.4402371644973755,
535
+ -0.467752605676651,
536
+ -0.42211639881134033,
537
+ -0.434103399515152,
538
+ -0.38376203179359436,
539
+ -0.3583239018917084,
540
+ -0.3261827230453491,
541
+ -0.29966747760772705,
542
+ -0.38840124011039734,
543
+ -0.32828328013420105,
544
+ -0.25409969687461853,
545
+ -0.2704025208950043,
546
+ -0.1985175758600235,
547
+ -0.20338541269302368,
548
+ -0.23216019570827484,
549
+ -0.26735031604766846,
550
+ -0.18867464363574982,
551
+ -0.38847246766090393,
552
+ -0.182339146733284,
553
+ -0.18704256415367126,
554
+ -0.1616264432668686,
555
+ -0.15969634056091309,
556
+ -0.14530818164348602,
557
+ -0.13175378739833832,
558
+ -0.10473348200321198,
559
+ -0.171867236495018,
560
+ -0.1426738202571869,
561
+ -0.13931553065776825,
562
+ -0.14417681097984314,
563
+ -0.05767478048801422,
564
+ -0.14531880617141724,
565
+ -0.05537816509604454,
566
+ -0.06925474852323532,
567
+ -0.162682443857193,
568
+ -0.10662886500358582,
569
+ -0.06461586803197861,
570
+ -0.05278106778860092,
571
+ -0.09546349942684174,
572
+ -0.10324031114578247,
573
+ -0.07626307010650635,
574
+ -0.10292515903711319,
575
+ -0.07728055119514465,
576
+ -0.09876345098018646,
577
+ -0.07488290220499039,
578
+ -0.05830881744623184,
579
+ -0.05468850955367088,
580
+ -0.09090279042720795,
581
+ -0.07504025101661682,
582
+ -0.07148993760347366,
583
+ -0.07156261801719666,
584
+ -0.0697956308722496,
585
+ -0.05241704359650612,
586
+ -0.04384676739573479,
587
+ -0.048265501856803894,
588
+ -0.07867752760648727,
589
+ -0.06092023849487305,
590
+ -0.0558161623775959,
591
+ -0.06381774693727493,
592
+ -0.06975483149290085,
593
+ -0.06581415981054306,
594
+ -0.053555652499198914,
595
+ -0.0474986732006073,
596
+ -0.04777195677161217,
597
+ -0.04158833995461464,
598
+ -0.04086068645119667,
599
+ -0.046969663351774216,
600
+ -0.07098674029111862,
601
+ -0.04583430290222168,
602
+ -0.02477315440773964,
603
+ -0.045496866106987,
604
+ -0.03886625915765762,
605
+ -0.033758021891117096,
606
+ -0.026911893859505653,
607
+ -0.026989782229065895,
608
+ -0.0445425882935524,
609
+ -0.03364324942231178
610
  ],
611
  "abs_loss": [
612
+ 3.8987743854522705,
613
+ 3.835925340652466,
614
+ 3.731152057647705,
615
+ 3.3448033332824707,
616
+ 2.9310805797576904,
617
+ 2.8018741607666016,
618
+ 2.832192897796631,
619
+ 2.8128607273101807,
620
+ 2.843754291534424,
621
+ 2.762322187423706,
622
+ 2.6791672706604004,
623
+ 2.8312129974365234,
624
+ 2.7969703674316406,
625
+ 2.793354034423828,
626
+ 2.753342628479004,
627
+ 2.7262606620788574,
628
+ 2.620635986328125,
629
+ 2.5968563556671143,
630
+ 2.31925106048584,
631
+ 2.0016016960144043,
632
+ 1.9219343662261963,
633
+ 1.7101284265518188,
634
+ 1.7175776958465576,
635
+ 1.6339759826660156,
636
+ 1.8100486993789673,
637
+ 1.4601774215698242,
638
+ 1.461230993270874,
639
+ 1.3801701068878174,
640
+ 1.3301787376403809,
641
+ 1.3739302158355713,
642
+ 1.587360143661499,
643
+ 1.3912031650543213,
644
+ 1.3633630275726318,
645
+ 1.4589648246765137,
646
+ 1.4376378059387207,
647
+ 1.2283248901367188,
648
+ 1.3686951398849487,
649
+ 1.261014461517334,
650
+ 1.1936320066452026,
651
+ 1.2106618881225586,
652
+ 1.1354954242706299,
653
+ 1.202142357826233,
654
+ 1.1697142124176025,
655
+ 1.216151237487793,
656
+ 0.9472143054008484,
657
+ 1.0352338552474976,
658
+ 1.2005023956298828,
659
+ 0.9383926391601562,
660
+ 0.9692818522453308,
661
+ 0.8716940879821777,
662
+ 0.9582070112228394,
663
+ 1.061899185180664,
664
+ 0.9574461579322815,
665
+ 1.0999226570129395,
666
+ 0.8257886171340942,
667
+ 0.9105151891708374,
668
+ 0.7686405181884766,
669
+ 0.7620456218719482,
670
+ 0.8083024621009827,
671
+ 0.7366126775741577,
672
+ 0.64865642786026,
673
+ 0.6970773935317993,
674
+ 0.5407489538192749,
675
+ 0.9302119016647339,
676
+ 0.6019563674926758,
677
+ 0.6286913156509399,
678
+ 0.6697531938552856,
679
+ 0.85337895154953,
680
+ 0.605627715587616,
681
+ 0.6994856595993042,
682
+ 0.6913561820983887,
683
+ 0.7227469086647034,
684
+ 0.8089389204978943,
685
+ 0.679562509059906,
686
+ 0.5462037324905396,
687
+ 0.5866653919219971,
688
+ 0.48199528455734253,
689
+ 0.49292898178100586,
690
+ 0.5071792602539062,
691
+ 0.6359560489654541,
692
+ 0.4345041811466217,
693
+ 0.5750279426574707,
694
+ 0.5141332149505615,
695
+ 0.48265522718429565,
696
+ 0.38371920585632324,
697
+ 0.6727322936058044,
698
+ 0.524191677570343,
699
+ 0.46154582500457764,
700
+ 0.38243192434310913,
701
+ 0.5157103538513184,
702
+ 0.48300936818122864,
703
+ 0.5282471179962158,
704
+ 0.47535738348960876,
705
+ 0.4935920834541321,
706
+ 0.4585495889186859,
707
+ 0.4682696759700775,
708
+ 0.3801548182964325,
709
+ 0.3888419568538666,
710
+ 0.314349889755249,
711
+ 0.40311598777770996,
712
+ 0.393927663564682,
713
+ 0.3618808388710022,
714
+ 0.31192538142204285,
715
+ 0.29459425806999207,
716
+ 0.38845521211624146,
717
+ 0.3338332772254944,
718
+ 0.45690685510635376,
719
+ 0.2870320677757263,
720
+ 0.30454182624816895,
721
+ 0.39305591583251953,
722
+ 0.4107697606086731,
723
+ 0.2857040762901306,
724
+ 0.40057629346847534,
725
+ 0.2520090937614441,
726
+ 0.3365999460220337,
727
+ 0.3793593645095825,
728
+ 0.2781757414340973,
729
+ 0.23415732383728027,
730
+ 0.17023888230323792,
731
+ 0.236487478017807,
732
+ 0.29216936230659485,
733
+ 0.18099826574325562,
734
+ 0.28724172711372375,
735
+ 0.15562580525875092,
736
+ 0.24116644263267517,
737
+ 0.29714399576187134,
738
+ 0.23464536666870117,
739
+ 0.25069287419319153,
740
+ 0.24226970970630646,
741
+ 0.27992311120033264,
742
+ 0.286587655544281,
743
+ 0.17398861050605774,
744
+ 0.28588318824768066,
745
+ 0.2069043666124344,
746
+ 0.18253867328166962,
747
+ 0.24283462762832642,
748
+ 0.26914891600608826,
749
+ 0.22705870866775513,
750
+ 0.1970517933368683,
751
+ 0.17965485155582428,
752
+ 0.2492925226688385,
753
+ 0.1700528860092163,
754
+ 0.16555199027061462,
755
+ 0.22087526321411133,
756
+ 0.22362147271633148,
757
+ 0.23984941840171814,
758
+ 0.23964354395866394,
759
+ 0.17572689056396484,
760
+ 0.18303079903125763,
761
+ 0.20619693398475647
762
  ],
763
  "zipf_loss": [
764
+ 5.992541313171387,
765
+ 4.256757736206055,
766
+ 2.3342857360839844,
767
+ 1.142124891281128,
768
+ 0.7460483908653259,
769
+ 0.6850723028182983,
770
+ 0.6697337031364441,
771
+ 0.6657452583312988,
772
+ 0.6604452133178711,
773
+ 0.6608524918556213,
774
+ 0.6651840209960938,
775
+ 0.6654003262519836,
776
+ 0.6609048247337341,
777
+ 0.6551106572151184,
778
+ 0.6510313749313354,
779
+ 0.6086770296096802,
780
+ 0.502957820892334,
781
+ 0.39937275648117065,
782
+ 0.3074512779712677,
783
+ 0.25372886657714844,
784
+ 0.22332003712654114,
785
+ 0.20783749222755432,
786
+ 0.2116575390100479,
787
+ 0.17998555302619934,
788
+ 0.1737050563097,
789
+ 0.1659075915813446,
790
+ 0.16389304399490356,
791
+ 0.15481875836849213,
792
+ 0.14997941255569458,
793
+ 0.14742501080036163,
794
+ 0.13379204273223877,
795
+ 0.1261483132839203,
796
+ 0.1256428062915802,
797
+ 0.12281343340873718,
798
+ 0.1190091073513031,
799
+ 0.11422161012887955,
800
+ 0.10806499421596527,
801
+ 0.1024467945098877,
802
+ 0.1175742894411087,
803
+ 0.10470254719257355,
804
+ 0.09950097650289536,
805
+ 0.09661951661109924,
806
+ 0.08176100254058838,
807
+ 0.09228333085775375,
808
+ 0.0832676887512207,
809
+ 0.08387405425310135,
810
+ 0.07440327852964401,
811
+ 0.09880977869033813,
812
+ 0.07880298793315887,
813
+ 0.07589824497699738,
814
+ 0.07264722883701324,
815
+ 0.05839239060878754,
816
+ 0.057406291365623474,
817
+ 0.051846496760845184,
818
+ 0.06693202257156372,
819
+ 0.051612261682748795,
820
+ 0.055289462208747864,
821
+ 0.07129812985658646,
822
+ 0.04794581979513168,
823
+ 0.06939932703971863,
824
+ 0.05468002334237099,
825
+ 0.057209789752960205,
826
+ 0.0639333575963974,
827
+ 0.03705426678061485,
828
+ 0.05057953670620918,
829
+ 0.04965557903051376,
830
+ 0.04756723344326019,
831
+ 0.030643729493021965,
832
+ 0.043815724551677704,
833
+ 0.04578302800655365,
834
+ 0.05483042076230049,
835
+ 0.03150896355509758,
836
+ 0.028118720278143883,
837
+ 0.04513361677527428,
838
+ 0.028530914336442947,
839
+ 0.034275688230991364,
840
+ 0.04149279743432999,
841
+ 0.04125683009624481,
842
+ 0.04158829152584076,
843
+ 0.03704618662595749,
844
+ 0.034520722925662994,
845
+ 0.023296881467103958,
846
+ 0.030839255079627037,
847
+ 0.042560875415802,
848
+ 0.04106279835104942,
849
+ 0.019770771265029907,
850
+ 0.01801365055143833,
851
+ 0.023459654301404953,
852
+ 0.03903378173708916,
853
+ 0.03520215302705765,
854
+ 0.02873474918305874,
855
+ 0.02199714072048664,
856
+ 0.03557206690311432,
857
+ 0.042527176439762115,
858
+ 0.03995896130800247,
859
+ 0.042615462094545364,
860
+ 0.05649139732122421,
861
+ 0.04118660092353821,
862
+ 0.0336117222905159,
863
+ 0.06539583206176758,
864
+ 0.05143829807639122,
865
+ 0.03835456073284149,
866
+ 0.03905396908521652,
867
+ 0.03247641399502754,
868
+ 0.038659460842609406,
869
+ 0.02400336042046547,
870
+ 0.028478197753429413,
871
+ 0.03173477202653885,
872
+ 0.023022141307592392,
873
+ 0.024034500122070312,
874
+ 0.03353904187679291,
875
+ 0.029786277562379837,
876
+ 0.02293926477432251,
877
+ 0.05721593275666237,
878
+ 0.02410007268190384,
879
+ 0.02435165084898472,
880
+ 0.02972968854010105,
881
+ 0.03335817903280258,
882
+ 0.0289214625954628,
883
+ 0.030072137713432312,
884
+ 0.044025976210832596,
885
+ 0.05235940217971802,
886
+ 0.027709070593118668,
887
+ 0.04703980311751366,
888
+ 0.03810810297727585,
889
+ 0.03297300264239311,
890
+ 0.024960467591881752,
891
+ 0.03001183271408081,
892
+ 0.04660506919026375,
893
+ 0.030839864164590836,
894
+ 0.02685823291540146,
895
+ 0.03118157386779785,
896
+ 0.043957799673080444,
897
+ 0.04862763732671738,
898
+ 0.03027738630771637,
899
+ 0.04692744463682175,
900
+ 0.031047239899635315,
901
+ 0.02710168994963169,
902
+ 0.028775956481695175,
903
+ 0.03928530216217041,
904
+ 0.04044933617115021,
905
+ 0.03240543231368065,
906
+ 0.039550866931676865,
907
+ 0.022889159619808197,
908
+ 0.023003853857517242,
909
+ 0.031042777001857758,
910
+ 0.02698989398777485,
911
+ 0.04021558538079262,
912
+ 0.04178132116794586,
913
+ 0.023517422378063202
914
  ],
915
  "denoise_loss": [],
916
  "ortho_loss": [
917
+ 0.6933014988899231,
918
+ 0.37083250284194946,
919
+ 0.16746486723423004,
920
+ 0.0885070413351059,
921
+ 0.06592030823230743,
922
+ 0.053648799657821655,
923
+ 0.04771490767598152,
924
+ 0.04534199461340904,
925
+ 0.0437336266040802,
926
+ 0.045895759016275406,
927
+ 0.05053376406431198,
928
+ 0.0523027703166008,
929
+ 0.05737421289086342,
930
+ 0.061693500727415085,
931
+ 0.06343631446361542,
932
+ 0.06562791019678116,
933
+ 0.06717279553413391,
934
+ 0.07206566631793976,
935
+ 0.07831596583127975,
936
+ 0.07906866073608398,
937
+ 0.08471731096506119,
938
+ 0.09428071230649948,
939
+ 0.10492909699678421,
940
+ 0.11721401661634445,
941
+ 0.12516844272613525,
942
+ 0.1334349811077118,
943
+ 0.14114034175872803,
944
+ 0.1503930687904358,
945
+ 0.15645001828670502,
946
+ 0.16175302863121033,
947
+ 0.1684732288122177,
948
+ 0.16980968415737152,
949
+ 0.1736874133348465,
950
+ 0.17783427238464355,
951
+ 0.18060865998268127,
952
+ 0.18240122497081757,
953
+ 0.1839177906513214,
954
+ 0.18623745441436768,
955
+ 0.1907666027545929,
956
+ 0.19191065430641174,
957
+ 0.19565843045711517,
958
+ 0.19815172255039215,
959
+ 0.20228537917137146,
960
+ 0.20597098767757416,
961
+ 0.2075631469488144,
962
+ 0.20883804559707642,
963
+ 0.2080991268157959,
964
+ 0.21085670590400696,
965
+ 0.21062801778316498,
966
+ 0.2116369903087616,
967
+ 0.2120591253042221,
968
+ 0.21061359345912933,
969
+ 0.20848363637924194,
970
+ 0.20663155615329742,
971
+ 0.2056088000535965,
972
+ 0.20723474025726318,
973
+ 0.2063807100057602,
974
+ 0.20915858447551727,
975
+ 0.20919714868068695,
976
+ 0.20870265364646912,
977
+ 0.2069307267665863,
978
+ 0.20666652917861938,
979
+ 0.2061752825975418,
980
+ 0.2027379870414734,
981
+ 0.20436672866344452,
982
+ 0.20579716563224792,
983
+ 0.20884613692760468,
984
+ 0.21337348222732544,
985
+ 0.21834859251976013,
986
+ 0.21869564056396484,
987
+ 0.2199230194091797,
988
+ 0.22768796980381012,
989
+ 0.23089125752449036,
990
+ 0.23446932435035706,
991
+ 0.23750188946723938,
992
+ 0.2428743839263916,
993
+ 0.2425122857093811,
994
+ 0.24684441089630127,
995
+ 0.24865762889385223,
996
+ 0.24414007365703583,
997
+ 0.2449251115322113,
998
+ 0.24844960868358612,
999
+ 0.2532559931278229,
1000
+ 0.2549189329147339,
1001
+ 0.25830599665641785,
1002
+ 0.256623238325119,
1003
+ 0.25953999161720276,
1004
+ 0.2646258771419525,
1005
+ 0.26612550020217896,
1006
+ 0.26787811517715454,
1007
+ 0.2701391279697418,
1008
+ 0.27274689078330994,
1009
+ 0.274588942527771,
1010
+ 0.27538907527923584,
1011
+ 0.27801740169525146,
1012
+ 0.2798006534576416,
1013
+ 0.27908483147621155,
1014
+ 0.2781679928302765,
1015
+ 0.28107044100761414,
1016
+ 0.2800515592098236,
1017
+ 0.28154537081718445,
1018
+ 0.2851882874965668,
1019
+ 0.29015690088272095,
1020
+ 0.2916761636734009,
1021
+ 0.29237350821495056,
1022
+ 0.29165220260620117,
1023
+ 0.295254647731781,
1024
+ 0.29890671372413635,
1025
+ 0.30145129561424255,
1026
+ 0.3019912540912628,
1027
+ 0.30194753408432007,
1028
+ 0.3042812943458557,
1029
+ 0.30524149537086487,
1030
+ 0.3049549162387848,
1031
+ 0.3069272041320801,
1032
+ 0.30974724888801575,
1033
+ 0.31134963035583496,
1034
+ 0.31236183643341064,
1035
+ 0.3140103220939636,
1036
+ 0.3156379163265228,
1037
+ 0.3186745047569275,
1038
+ 0.31933704018592834,
1039
+ 0.3208130896091461,
1040
+ 0.3216458857059479,
1041
+ 0.32485339045524597,
1042
+ 0.3259000778198242,
1043
+ 0.3260437250137329,
1044
+ 0.32846739888191223,
1045
+ 0.3293222486972809,
1046
+ 0.33021095395088196,
1047
+ 0.33130118250846863,
1048
+ 0.33234986662864685,
1049
+ 0.3325884938240051,
1050
+ 0.33358755707740784,
1051
+ 0.3331451416015625,
1052
+ 0.33463388681411743,
1053
+ 0.33540332317352295,
1054
+ 0.3352293372154236,
1055
+ 0.3365360498428345,
1056
+ 0.33647823333740234,
1057
+ 0.3373063802719116,
1058
+ 0.3373261094093323,
1059
+ 0.3375466763973236,
1060
+ 0.33824118971824646,
1061
+ 0.3386029601097107,
1062
+ 0.33914104104042053,
1063
+ 0.3400459289550781,
1064
+ 0.3409873843193054,
1065
+ 0.3414129614830017,
1066
+ 0.3418258726596832
1067
  ],
1068
  "lr": [
1069
+ 8.376068376068378e-06,
1070
+ 1.6923076923076924e-05,
1071
+ 2.5470085470085475e-05,
1072
+ 3.401709401709402e-05,
1073
+ 4e-05,
1074
+ 4e-05,
1075
+ 4e-05,
1076
+ 4e-05,
1077
+ 4e-05,
1078
+ 4e-05,
1079
+ 4e-05,
1080
+ 4e-05,
1081
+ 4e-05,
1082
+ 4e-05,
1083
+ 4e-05,
1084
+ 4e-05,
1085
+ 4e-05,
1086
+ 4e-05,
1087
+ 4e-05,
1088
+ 4e-05,
1089
+ 4e-05,
1090
+ 4e-05,
1091
+ 4e-05,
1092
+ 4e-05,
1093
+ 4e-05,
1094
+ 4e-05,
1095
+ 4e-05,
1096
+ 4e-05,
1097
+ 4e-05,
1098
+ 4e-05,
1099
+ 4e-05,
1100
+ 4e-05,
1101
+ 4e-05,
1102
+ 4e-05,
1103
+ 4e-05,
1104
+ 4e-05,
1105
+ 4e-05,
1106
+ 4e-05,
1107
+ 4e-05,
1108
+ 4e-05,
1109
+ 4e-05,
1110
+ 4e-05,
1111
+ 4e-05,
1112
+ 4e-05,
1113
+ 4e-05,
1114
+ 4e-05,
1115
+ 4e-05,
1116
+ 4e-05,
1117
+ 4e-05,
1118
+ 4e-05,
1119
+ 4e-05,
1120
+ 4e-05,
1121
+ 4e-05,
1122
+ 4e-05,
1123
+ 4e-05,
1124
+ 4e-05,
1125
+ 4e-05,
1126
+ 4e-05,
1127
+ 4e-05,
1128
+ 4e-05,
1129
+ 4e-05,
1130
+ 4e-05,
1131
+ 4e-05,
1132
+ 4e-05,
1133
+ 4e-05,
1134
+ 4e-05,
1135
+ 4e-05,
1136
+ 4e-05,
1137
+ 4e-05,
1138
+ 4e-05,
1139
+ 4e-05,
1140
+ 4e-05,
1141
+ 4e-05,
1142
+ 4e-05,
1143
+ 4e-05,
1144
+ 4e-05,
1145
+ 4e-05,
1146
+ 4e-05,
1147
+ 4e-05,
1148
+ 4e-05,
1149
+ 4e-05,
1150
+ 4e-05,
1151
+ 4e-05,
1152
+ 4e-05,
1153
+ 4e-05,
1154
+ 4e-05,
1155
+ 4e-05,
1156
+ 4e-05,
1157
+ 4e-05,
1158
+ 4e-05,
1159
+ 4e-05,
1160
+ 3.993593461639863e-05,
1161
+ 3.934273662008964e-05,
1162
+ 3.874953862378065e-05,
1163
+ 3.815634062747166e-05,
1164
+ 3.7563142631162665e-05,
1165
+ 3.696994463485368e-05,
1166
+ 3.637674663854469e-05,
1167
+ 3.5783548642235693e-05,
1168
+ 3.519035064592671e-05,
1169
+ 3.459715264961771e-05,
1170
+ 3.400395465330873e-05,
1171
+ 3.341075665699973e-05,
1172
+ 3.281755866069075e-05,
1173
+ 3.2224360664381764e-05,
1174
+ 3.1251515950435014e-05,
1175
+ 3.065831795412602e-05,
1176
+ 3.0065119957817037e-05,
1177
+ 2.947192196150804e-05,
1178
+ 2.887872396519905e-05,
1179
+ 2.8285525968890065e-05,
1180
+ 2.769232797258107e-05,
1181
+ 2.709912997627208e-05,
1182
+ 2.6505931979963087e-05,
1183
+ 2.5912733983654104e-05,
1184
+ 2.5319535987345117e-05,
1185
+ 2.472633799103612e-05,
1186
+ 2.4133139994727132e-05,
1187
+ 2.3539941998418135e-05,
1188
+ 2.2946744002109148e-05,
1189
+ 2.1973899288162408e-05,
1190
+ 2.138070129185341e-05,
1191
+ 2.0787503295544424e-05,
1192
+ 2.019430529923544e-05,
1193
+ 1.9601107302926443e-05,
1194
+ 1.900790930661746e-05,
1195
+ 1.8414711310308462e-05,
1196
+ 1.7821513313999475e-05,
1197
+ 1.7228315317690488e-05,
1198
+ 1.663511732138149e-05,
1199
+ 1.6041919325072507e-05,
1200
+ 1.544872132876351e-05,
1201
+ 1.4855523332454524e-05,
1202
+ 1.4262325336145537e-05,
1203
+ 1.366912733983654e-05,
1204
+ 1.2696282625889797e-05,
1205
+ 1.2103084629580812e-05,
1206
+ 1.1509886633271816e-05,
1207
+ 1.0916688636962829e-05,
1208
+ 1.0323490640653833e-05,
1209
+ 9.730292644344846e-06,
1210
+ 9.137094648035861e-06,
1211
+ 8.543896651726864e-06,
1212
+ 7.950698655417878e-06,
1213
+ 7.357500659108881e-06,
1214
+ 6.764302662799895e-06,
1215
+ 6.171104666490909e-06,
1216
+ 5.577906670181913e-06,
1217
+ 4.984708673872927e-06,
1218
+ 4.391510677563931e-06
1219
  ],
1220
  "emb_lr": [],
1221
  "eval_step": [
 
1231
  7788
1232
  ],
1233
  "eval_accuracy": [
1234
+ 0.0,
1235
+ 0.18,
1236
+ 0.74,
1237
+ 0.94,
1238
+ 0.99,
1239
  0.95,
1240
  0.99,
1241
  1.0,
1242
+ 0.99,
 
 
 
1243
  1.0
1244
  ]
1245
  },
1246
+ "final_accuracy": 0.9983333333333333,
1247
  "sft_eval": {
1248
  "config": {
1249
  "ops": "add_sub",
1250
  "K": null,
1251
  "mode": "sft",
1252
  "n_digits": 6,
1253
+ "n_per_split": 100
1254
  },
1255
  "splits": {
1256
  "add_S0": {
1257
+ "full_accuracy": 0.98,
1258
+ "n_examples": 100,
1259
  "per_subtask": {
1260
  "SA": {
1261
+ "accuracy": 0.9983471074380166,
1262
+ "count": 605
1263
  },
1264
  "SS": {
1265
+ "accuracy": 0.9894736842105263,
1266
+ "count": 95
1267
  }
1268
  }
1269
  },
1270
  "add_S1": {
1271
+ "full_accuracy": 0.98,
1272
+ "n_examples": 100,
1273
  "per_subtask": {
1274
  "SA": {
1275
+ "accuracy": 0.9950980392156863,
1276
+ "count": 204
1277
  },
1278
  "SC": {
1279
+ "accuracy": 0.9940828402366864,
1280
+ "count": 169
1281
  },
1282
  "SS": {
1283
  "accuracy": 1.0,
1284
+ "count": 31
1285
  },
1286
  "UC": {
1287
+ "accuracy": 1.0,
1288
+ "count": 296
1289
  }
1290
  }
1291
  },
1292
  "add_S2": {
1293
+ "full_accuracy": 0.96,
1294
+ "n_examples": 100,
1295
  "per_subtask": {
1296
  "SA": {
1297
+ "accuracy": 1.0,
1298
+ "count": 163
1299
  },
1300
  "SC": {
1301
+ "accuracy": 0.9769230769230769,
1302
+ "count": 130
1303
  },
1304
  "SS": {
1305
+ "accuracy": 0.9770114942528736,
1306
+ "count": 87
1307
  },
1308
  "UC": {
1309
+ "accuracy": 1.0,
1310
+ "count": 203
1311
  },
1312
  "US": {
1313
+ "accuracy": 1.0,
1314
+ "count": 117
1315
  }
1316
  }
1317
  },
1318
  "add_S3": {
1319
+ "full_accuracy": 0.76,
1320
+ "n_examples": 100,
1321
  "per_subtask": {
1322
  "SA": {
1323
+ "accuracy": 1.0,
1324
+ "count": 121
1325
  },
1326
  "SC": {
1327
+ "accuracy": 1.0,
1328
+ "count": 121
1329
  },
1330
  "SS": {
1331
  "accuracy": 1.0,
1332
+ "count": 49
1333
  },
1334
  "UC": {
1335
+ "accuracy": 0.8709677419354839,
1336
+ "count": 186
1337
  },
1338
  "US": {
1339
+ "accuracy": 1.0,
1340
+ "count": 223
1341
  }
1342
  }
1343
  },
1344
  "add_S4": {
1345
+ "full_accuracy": 0.55,
1346
+ "n_examples": 100,
1347
  "per_subtask": {
1348
  "SA": {
1349
  "accuracy": 1.0,
1350
+ "count": 104
1351
  },
1352
  "SC": {
1353
+ "accuracy": 1.0,
1354
+ "count": 106
1355
  },
1356
  "SS": {
1357
+ "accuracy": 1.0,
1358
+ "count": 23
1359
  },
1360
  "UC": {
1361
+ "accuracy": 0.8,
1362
+ "count": 160
1363
  },
1364
  "US": {
1365
+ "accuracy": 0.9022801302931596,
1366
+ "count": 307
1367
  }
1368
  }
1369
  },
1370
  "add_S5": {
1371
+ "full_accuracy": 0.32,
1372
+ "n_examples": 100,
1373
  "per_subtask": {
1374
  "SA": {
1375
  "accuracy": 1.0,
1376
+ "count": 100
1377
  },
1378
  "SC": {
1379
+ "accuracy": 1.0,
1380
+ "count": 100
1381
  },
1382
  "UC": {
1383
+ "accuracy": 0.49,
1384
+ "count": 100
1385
  },
1386
  "US": {
1387
+ "accuracy": 0.6975,
1388
+ "count": 400
1389
  }
1390
  }
1391
  },
1392
  "add_S6": {
1393
+ "full_accuracy": 0.61,
1394
+ "n_examples": 100,
1395
  "per_subtask": {
1396
  "SC": {
1397
  "accuracy": 1.0,
1398
+ "count": 100
1399
  },
1400
  "UC": {
1401
+ "accuracy": 0.67,
1402
+ "count": 100
1403
  },
1404
  "US": {
1405
+ "accuracy": 0.782,
1406
+ "count": 500
1407
  }
1408
  }
1409
  },
1410
  "add_random": {
1411
+ "full_accuracy": 0.975,
1412
  "n_examples": 200,
1413
  "per_subtask": {
1414
  "SA": {
1415
+ "accuracy": 1.0,
1416
+ "count": 447
1417
  },
1418
  "SC": {
1419
+ "accuracy": 0.996875,
1420
+ "count": 320
1421
  },
1422
  "SS": {
1423
+ "accuracy": 1.0,
1424
+ "count": 56
1425
  },
1426
  "UC": {
1427
+ "accuracy": 0.9924385633270322,
1428
+ "count": 529
1429
  },
1430
  "US": {
1431
+ "accuracy": 1.0,
1432
+ "count": 48
1433
  }
1434
  }
1435
  },
1436
  "add_C3": {
1437
+ "full_accuracy": 0.83,
1438
+ "n_examples": 100,
1439
  "per_subtask": {
1440
  "SA": {
1441
  "accuracy": 1.0,
1442
+ "count": 300
1443
  },
1444
  "SC": {
1445
  "accuracy": 1.0,
1446
+ "count": 100
1447
  },
1448
  "UC": {
1449
+ "accuracy": 0.9119170984455959,
1450
+ "count": 193
1451
  },
1452
  "US": {
1453
+ "accuracy": 0.9626168224299065,
1454
+ "count": 107
1455
  }
1456
  }
1457
  },
1458
  "add_C4": {
1459
+ "full_accuracy": 0.8,
1460
+ "n_examples": 100,
1461
  "per_subtask": {
1462
  "SA": {
1463
+ "accuracy": 1.0,
1464
+ "count": 200
1465
  },
1466
  "SC": {
1467
  "accuracy": 1.0,
1468
+ "count": 100
1469
  },
1470
  "UC": {
1471
+ "accuracy": 0.92578125,
1472
+ "count": 256
1473
  },
1474
  "US": {
1475
+ "accuracy": 0.9513888888888888,
1476
+ "count": 144
1477
  }
1478
  }
1479
  },
1480
  "add_C5": {
1481
+ "full_accuracy": 0.84,
1482
+ "n_examples": 100,
1483
  "per_subtask": {
1484
  "SA": {
1485
  "accuracy": 1.0,
1486
+ "count": 100
1487
  },
1488
  "SC": {
1489
+ "accuracy": 1.0,
1490
+ "count": 100
1491
  },
1492
  "UC": {
1493
+ "accuracy": 0.9575163398692811,
1494
+ "count": 306
1495
  },
1496
  "US": {
1497
+ "accuracy": 0.9639175257731959,
1498
+ "count": 194
1499
  }
1500
  }
1501
  },
1502
  "add_C6": {
1503
+ "full_accuracy": 0.8,
1504
+ "n_examples": 100,
1505
  "per_subtask": {
1506
  "SC": {
1507
  "accuracy": 1.0,
1508
+ "count": 100
1509
  },
1510
  "UC": {
1511
+ "accuracy": 0.9480874316939891,
1512
+ "count": 366
1513
  },
1514
  "US": {
1515
+ "accuracy": 0.9914529914529915,
1516
+ "count": 234
1517
  }
1518
  }
1519
  },
1520
  "sub_M0": {
1521
+ "full_accuracy": 0.97,
1522
+ "n_examples": 100,
1523
  "per_subtask": {
1524
  "MD": {
1525
+ "accuracy": 0.9950083194675541,
1526
+ "count": 601
1527
  },
1528
  "ME": {
1529
  "accuracy": 1.0,
1530
+ "count": 99
1531
  }
1532
  }
1533
  },
1534
  "sub_M1": {
1535
+ "full_accuracy": 0.98,
1536
+ "n_examples": 100,
1537
  "per_subtask": {
1538
  "MD": {
1539
+ "accuracy": 0.996415770609319,
1540
+ "count": 279
1541
  },
1542
  "MB": {
1543
+ "accuracy": 0.993103448275862,
1544
+ "count": 145
1545
  },
1546
  "ME": {
1547
  "accuracy": 1.0,
1548
+ "count": 24
1549
  },
1550
  "UB": {
1551
+ "accuracy": 1.0,
1552
+ "count": 252
1553
  }
1554
  }
1555
  },
1556
  "sub_M2": {
1557
+ "full_accuracy": 1.0,
1558
+ "n_examples": 100,
1559
  "per_subtask": {
1560
  "MD": {
1561
+ "accuracy": 1.0,
1562
+ "count": 213
1563
  },
1564
  "MB": {
1565
  "accuracy": 1.0,
1566
+ "count": 113
1567
  },
1568
  "ME": {
1569
+ "accuracy": 1.0,
1570
+ "count": 85
1571
  },
1572
  "UB": {
1573
+ "accuracy": 1.0,
1574
+ "count": 181
1575
  },
1576
  "UD": {
1577
  "accuracy": 1.0,
1578
+ "count": 108
1579
  }
1580
  }
1581
  },
1582
  "sub_M3": {
1583
+ "full_accuracy": 0.54,
1584
+ "n_examples": 100,
1585
  "per_subtask": {
1586
  "MD": {
1587
+ "accuracy": 1.0,
1588
+ "count": 179
1589
  },
1590
  "MB": {
1591
+ "accuracy": 1.0,
1592
+ "count": 103
1593
  },
1594
  "ME": {
1595
  "accuracy": 1.0,
1596
+ "count": 56
1597
  },
1598
  "UB": {
1599
+ "accuracy": 0.6912751677852349,
1600
+ "count": 149
1601
  },
1602
  "UD": {
1603
+ "accuracy": 1.0,
1604
+ "count": 213
1605
  }
1606
  }
1607
  },
1608
  "sub_M4": {
1609
+ "full_accuracy": 0.16,
1610
+ "n_examples": 100,
1611
  "per_subtask": {
1612
  "MD": {
1613
+ "accuracy": 1.0,
1614
+ "count": 200
1615
  },
1616
  "MB": {
1617
  "accuracy": 1.0,
1618
+ "count": 100
1619
  },
1620
  "UB": {
1621
+ "accuracy": 0.38,
1622
+ "count": 100
1623
  },
1624
  "UD": {
1625
+ "accuracy": 0.7733333333333333,
1626
+ "count": 300
1627
  }
1628
  }
1629
  },
1630
  "sub_M5": {
1631
+ "full_accuracy": 0.02,
1632
+ "n_examples": 100,
1633
  "per_subtask": {
1634
  "MD": {
1635
  "accuracy": 1.0,
1636
+ "count": 100
1637
  },
1638
  "MB": {
1639
  "accuracy": 1.0,
1640
+ "count": 100
1641
  },
1642
  "UB": {
1643
+ "accuracy": 0.28,
1644
+ "count": 100
1645
  },
1646
  "UD": {
1647
+ "accuracy": 0.5325,
1648
+ "count": 400
1649
  }
1650
  }
1651
  },
1652
  "sub_random": {
1653
+ "full_accuracy": 0.985,
1654
  "n_examples": 200,
1655
  "per_subtask": {
1656
  "MD": {
1657
+ "accuracy": 0.9983333333333333,
1658
+ "count": 600
1659
  },
1660
  "MB": {
1661
+ "accuracy": 0.9962546816479401,
1662
+ "count": 267
1663
  },
1664
  "ME": {
1665
  "accuracy": 1.0,
1666
+ "count": 53
1667
  },
1668
  "UB": {
1669
+ "accuracy": 0.9977220956719818,
1670
+ "count": 439
1671
  },
1672
  "UD": {
1673
+ "accuracy": 1.0,
1674
+ "count": 41
1675
  }
1676
  }
1677
  },
1678
  "sub_B3": {
1679
+ "full_accuracy": 0.94,
1680
+ "n_examples": 100,
1681
  "per_subtask": {
1682
  "MD": {
1683
+ "accuracy": 1.0,
1684
+ "count": 300
1685
  },
1686
  "MB": {
1687
  "accuracy": 1.0,
1688
+ "count": 100
1689
  },
1690
  "UB": {
1691
+ "accuracy": 0.9695431472081218,
1692
+ "count": 197
1693
  },
1694
  "UD": {
1695
+ "accuracy": 1.0,
1696
+ "count": 103
1697
  }
1698
  }
1699
  },
1700
  "sub_B4": {
1701
+ "full_accuracy": 0.73,
1702
+ "n_examples": 100,
1703
  "per_subtask": {
1704
  "MD": {
1705
  "accuracy": 1.0,
1706
+ "count": 200
1707
  },
1708
  "MB": {
1709
  "accuracy": 1.0,
1710
+ "count": 100
1711
  },
1712
  "UB": {
1713
+ "accuracy": 0.8906882591093117,
1714
+ "count": 247
1715
  },
1716
  "UD": {
1717
+ "accuracy": 0.9477124183006536,
1718
+ "count": 153
1719
  }
1720
  }
1721
  },
1722
  "sub_B5": {
1723
+ "full_accuracy": 0.69,
1724
+ "n_examples": 100,
1725
  "per_subtask": {
1726
  "MD": {
1727
  "accuracy": 1.0,
1728
+ "count": 100
1729
  },
1730
  "MB": {
1731
  "accuracy": 1.0,
1732
+ "count": 100
1733
  },
1734
  "UB": {
1735
+ "accuracy": 0.9194630872483222,
1736
+ "count": 298
1737
  },
1738
  "UD": {
1739
+ "accuracy": 0.8960396039603961,
1740
+ "count": 202
1741
  }
1742
  }
1743
  }
1744
  },
1745
  "summary": {
1746
+ "overall_accuracy": 0.7658333333333334,
1747
+ "total_examples": 2400,
1748
  "n_splits": 22
1749
  }
1750
  },
 
1754
  "K": 4,
1755
  "mode": "sorl",
1756
  "n_digits": 6,
1757
+ "n_per_split": 100
1758
  },
1759
  "splits": {
1760
  "add_S0": {
1761
  "full_accuracy": 1.0,
1762
+ "n_examples": 100,
1763
  "per_subtask": {
1764
  "SA": {
1765
  "accuracy": 1.0,
1766
+ "count": 605
1767
  },
1768
  "SS": {
1769
  "accuracy": 1.0,
1770
+ "count": 95
1771
  }
1772
  }
1773
  },
1774
  "add_S1": {
1775
  "full_accuracy": 1.0,
1776
+ "n_examples": 100,
1777
  "per_subtask": {
1778
  "SA": {
1779
  "accuracy": 1.0,
1780
+ "count": 204
1781
  },
1782
  "SC": {
1783
  "accuracy": 1.0,
1784
+ "count": 169
1785
  },
1786
  "SS": {
1787
  "accuracy": 1.0,
1788
+ "count": 31
1789
  },
1790
  "UC": {
1791
  "accuracy": 1.0,
1792
+ "count": 296
1793
  }
1794
  }
1795
  },
1796
  "add_S2": {
1797
  "full_accuracy": 1.0,
1798
+ "n_examples": 100,
1799
  "per_subtask": {
1800
  "SA": {
1801
  "accuracy": 1.0,
1802
+ "count": 163
1803
  },
1804
  "SC": {
1805
  "accuracy": 1.0,
1806
+ "count": 130
1807
  },
1808
  "SS": {
1809
  "accuracy": 1.0,
1810
+ "count": 87
1811
  },
1812
  "UC": {
1813
  "accuracy": 1.0,
1814
+ "count": 203
1815
  },
1816
  "US": {
1817
  "accuracy": 1.0,
1818
+ "count": 117
1819
  }
1820
  }
1821
  },
1822
  "add_S3": {
1823
  "full_accuracy": 1.0,
1824
+ "n_examples": 100,
1825
  "per_subtask": {
1826
  "SA": {
1827
  "accuracy": 1.0,
1828
+ "count": 121
1829
  },
1830
  "SC": {
1831
  "accuracy": 1.0,
1832
+ "count": 121
1833
  },
1834
  "SS": {
1835
  "accuracy": 1.0,
1836
+ "count": 49
1837
  },
1838
  "UC": {
1839
  "accuracy": 1.0,
1840
+ "count": 186
1841
  },
1842
  "US": {
1843
  "accuracy": 1.0,
1844
+ "count": 223
1845
  }
1846
  }
1847
  },
1848
  "add_S4": {
1849
  "full_accuracy": 1.0,
1850
+ "n_examples": 100,
1851
  "per_subtask": {
1852
  "SA": {
1853
  "accuracy": 1.0,
1854
+ "count": 104
1855
  },
1856
  "SC": {
1857
  "accuracy": 1.0,
1858
+ "count": 106
1859
  },
1860
  "SS": {
1861
  "accuracy": 1.0,
1862
+ "count": 23
1863
  },
1864
  "UC": {
1865
  "accuracy": 1.0,
1866
+ "count": 160
1867
  },
1868
  "US": {
1869
  "accuracy": 1.0,
1870
+ "count": 307
1871
  }
1872
  }
1873
  },
1874
  "add_S5": {
1875
+ "full_accuracy": 0.99,
1876
+ "n_examples": 100,
1877
  "per_subtask": {
1878
  "SA": {
1879
  "accuracy": 1.0,
1880
+ "count": 100
1881
  },
1882
  "SC": {
1883
  "accuracy": 1.0,
1884
+ "count": 100
1885
  },
1886
  "UC": {
1887
+ "accuracy": 0.99,
1888
+ "count": 100
1889
  },
1890
  "US": {
1891
  "accuracy": 1.0,
1892
+ "count": 400
1893
  }
1894
  }
1895
  },
1896
  "add_S6": {
1897
+ "full_accuracy": 0.99,
1898
+ "n_examples": 100,
1899
  "per_subtask": {
1900
  "SC": {
1901
  "accuracy": 1.0,
1902
+ "count": 100
1903
  },
1904
  "UC": {
1905
+ "accuracy": 0.99,
1906
+ "count": 100
1907
  },
1908
  "US": {
1909
  "accuracy": 1.0,
1910
+ "count": 500
1911
  }
1912
  }
1913
  },
 
1917
  "per_subtask": {
1918
  "SA": {
1919
  "accuracy": 1.0,
1920
+ "count": 447
1921
  },
1922
  "SC": {
1923
  "accuracy": 1.0,
1924
+ "count": 320
1925
  },
1926
  "SS": {
1927
  "accuracy": 1.0,
1928
+ "count": 56
1929
  },
1930
  "UC": {
1931
  "accuracy": 1.0,
1932
+ "count": 529
1933
  },
1934
  "US": {
1935
  "accuracy": 1.0,
1936
+ "count": 48
1937
  }
1938
  }
1939
  },
1940
  "add_C3": {
1941
  "full_accuracy": 1.0,
1942
+ "n_examples": 100,
1943
  "per_subtask": {
1944
  "SA": {
1945
  "accuracy": 1.0,
1946
+ "count": 300
1947
  },
1948
  "SC": {
1949
  "accuracy": 1.0,
1950
+ "count": 100
1951
  },
1952
  "UC": {
1953
  "accuracy": 1.0,
1954
+ "count": 193
1955
  },
1956
  "US": {
1957
  "accuracy": 1.0,
1958
+ "count": 107
1959
  }
1960
  }
1961
  },
1962
  "add_C4": {
1963
  "full_accuracy": 1.0,
1964
+ "n_examples": 100,
1965
  "per_subtask": {
1966
  "SA": {
1967
  "accuracy": 1.0,
1968
+ "count": 200
1969
  },
1970
  "SC": {
1971
  "accuracy": 1.0,
1972
+ "count": 100
1973
  },
1974
  "UC": {
1975
  "accuracy": 1.0,
1976
+ "count": 256
1977
  },
1978
  "US": {
1979
  "accuracy": 1.0,
1980
+ "count": 144
1981
  }
1982
  }
1983
  },
1984
  "add_C5": {
1985
  "full_accuracy": 1.0,
1986
+ "n_examples": 100,
1987
  "per_subtask": {
1988
  "SA": {
1989
  "accuracy": 1.0,
1990
+ "count": 100
1991
  },
1992
  "SC": {
1993
  "accuracy": 1.0,
1994
+ "count": 100
1995
  },
1996
  "UC": {
1997
  "accuracy": 1.0,
1998
+ "count": 306
1999
  },
2000
  "US": {
2001
  "accuracy": 1.0,
2002
+ "count": 194
2003
  }
2004
  }
2005
  },
2006
  "add_C6": {
2007
  "full_accuracy": 1.0,
2008
+ "n_examples": 100,
2009
  "per_subtask": {
2010
  "SC": {
2011
  "accuracy": 1.0,
2012
+ "count": 100
2013
  },
2014
  "UC": {
2015
  "accuracy": 1.0,
2016
+ "count": 366
2017
  },
2018
  "US": {
2019
  "accuracy": 1.0,
2020
+ "count": 234
2021
  }
2022
  }
2023
  },
2024
  "sub_M0": {
2025
  "full_accuracy": 1.0,
2026
+ "n_examples": 100,
2027
  "per_subtask": {
2028
  "MD": {
2029
  "accuracy": 1.0,
2030
+ "count": 601
2031
  },
2032
  "ME": {
2033
  "accuracy": 1.0,
2034
+ "count": 99
2035
  }
2036
  }
2037
  },
2038
  "sub_M1": {
2039
  "full_accuracy": 1.0,
2040
+ "n_examples": 100,
2041
  "per_subtask": {
2042
  "MD": {
2043
  "accuracy": 1.0,
2044
+ "count": 279
2045
  },
2046
  "MB": {
2047
  "accuracy": 1.0,
2048
+ "count": 145
2049
  },
2050
  "ME": {
2051
  "accuracy": 1.0,
2052
+ "count": 24
2053
  },
2054
  "UB": {
2055
  "accuracy": 1.0,
2056
+ "count": 252
2057
  }
2058
  }
2059
  },
2060
  "sub_M2": {
2061
  "full_accuracy": 1.0,
2062
+ "n_examples": 100,
2063
  "per_subtask": {
2064
  "MD": {
2065
  "accuracy": 1.0,
2066
+ "count": 213
2067
  },
2068
  "MB": {
2069
  "accuracy": 1.0,
2070
+ "count": 113
2071
  },
2072
  "ME": {
2073
  "accuracy": 1.0,
2074
+ "count": 85
2075
  },
2076
  "UB": {
2077
  "accuracy": 1.0,
2078
+ "count": 181
2079
  },
2080
  "UD": {
2081
  "accuracy": 1.0,
2082
+ "count": 108
2083
  }
2084
  }
2085
  },
2086
  "sub_M3": {
2087
  "full_accuracy": 1.0,
2088
+ "n_examples": 100,
2089
  "per_subtask": {
2090
  "MD": {
2091
  "accuracy": 1.0,
2092
+ "count": 179
2093
  },
2094
  "MB": {
2095
  "accuracy": 1.0,
2096
+ "count": 103
2097
  },
2098
  "ME": {
2099
  "accuracy": 1.0,
2100
+ "count": 56
2101
  },
2102
  "UB": {
2103
  "accuracy": 1.0,
2104
+ "count": 149
2105
  },
2106
  "UD": {
2107
  "accuracy": 1.0,
2108
+ "count": 213
2109
  }
2110
  }
2111
  },
2112
  "sub_M4": {
2113
+ "full_accuracy": 0.99,
2114
+ "n_examples": 100,
2115
  "per_subtask": {
2116
  "MD": {
2117
  "accuracy": 1.0,
2118
+ "count": 200
2119
  },
2120
  "MB": {
2121
  "accuracy": 1.0,
2122
+ "count": 100
2123
  },
2124
  "UB": {
2125
+ "accuracy": 0.99,
2126
+ "count": 100
2127
  },
2128
  "UD": {
2129
  "accuracy": 1.0,
2130
+ "count": 300
2131
  }
2132
  }
2133
  },
2134
  "sub_M5": {
2135
+ "full_accuracy": 0.99,
2136
+ "n_examples": 100,
2137
  "per_subtask": {
2138
  "MD": {
2139
  "accuracy": 1.0,
2140
+ "count": 100
2141
  },
2142
  "MB": {
2143
  "accuracy": 1.0,
2144
+ "count": 100
2145
  },
2146
  "UB": {
2147
+ "accuracy": 0.99,
2148
+ "count": 100
2149
  },
2150
  "UD": {
2151
  "accuracy": 1.0,
2152
+ "count": 400
2153
  }
2154
  }
2155
  },
 
2159
  "per_subtask": {
2160
  "MD": {
2161
  "accuracy": 1.0,
2162
+ "count": 600
2163
  },
2164
  "MB": {
2165
  "accuracy": 1.0,
2166
+ "count": 267
2167
  },
2168
  "ME": {
2169
  "accuracy": 1.0,
2170
+ "count": 53
2171
  },
2172
  "UB": {
2173
  "accuracy": 1.0,
2174
+ "count": 439
2175
  },
2176
  "UD": {
2177
  "accuracy": 1.0,
2178
+ "count": 41
2179
  }
2180
  }
2181
  },
2182
  "sub_B3": {
2183
  "full_accuracy": 1.0,
2184
+ "n_examples": 100,
2185
  "per_subtask": {
2186
  "MD": {
2187
  "accuracy": 1.0,
2188
+ "count": 300
2189
  },
2190
  "MB": {
2191
  "accuracy": 1.0,
2192
+ "count": 100
2193
  },
2194
  "UB": {
2195
  "accuracy": 1.0,
2196
+ "count": 197
2197
  },
2198
  "UD": {
2199
  "accuracy": 1.0,
2200
+ "count": 103
2201
  }
2202
  }
2203
  },
2204
  "sub_B4": {
2205
  "full_accuracy": 1.0,
2206
+ "n_examples": 100,
2207
  "per_subtask": {
2208
  "MD": {
2209
  "accuracy": 1.0,
2210
+ "count": 200
2211
  },
2212
  "MB": {
2213
  "accuracy": 1.0,
2214
+ "count": 100
2215
  },
2216
  "UB": {
2217
  "accuracy": 1.0,
2218
+ "count": 247
2219
  },
2220
  "UD": {
2221
  "accuracy": 1.0,
2222
+ "count": 153
2223
  }
2224
  }
2225
  },
2226
  "sub_B5": {
2227
  "full_accuracy": 1.0,
2228
+ "n_examples": 100,
2229
  "per_subtask": {
2230
  "MD": {
2231
  "accuracy": 1.0,
2232
+ "count": 100
2233
  },
2234
  "MB": {
2235
  "accuracy": 1.0,
2236
+ "count": 100
2237
  },
2238
  "UB": {
2239
  "accuracy": 1.0,
2240
+ "count": 298
2241
  },
2242
  "UD": {
2243
  "accuracy": 1.0,
2244
+ "count": 202
2245
  }
2246
  }
2247
  }
2248
  },
2249
  "summary": {
2250
+ "overall_accuracy": 0.9983333333333333,
2251
+ "total_examples": 2400,
2252
  "n_splits": 22
2253
  }
2254
  },
2255
+ "sorl_overall_accuracy": 0.9983333333333333,
2256
+ "sft_overall_accuracy": 0.7658333333333334
2257
  }
add_sub_sorl_v1_abs50_50K/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3807a271457535e90facd4a2c2b7452fb1470e8345fa33b069288d979eff66d5
3
  size 650466940
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6342cf5867d670c96b8fb7972956a9553f7a1f0ec1e2656c505d55780ccbe665
3
  size 650466940
add_sub_sorl_v1_abs50_50K/train_config.json CHANGED
@@ -1,35 +1,84 @@
1
  {
2
- "mode": "sorl",
3
- "ops": "add_sub",
4
- "n_digits": 6,
5
- "n_layer": 2,
6
- "n_head": 3,
7
- "n_embd": 510,
8
- "abs_vocab": 50,
9
  "K": 4,
 
 
 
 
 
 
10
  "alpha_info_gain": 10.0,
11
  "alpha_abs": 0.1,
12
  "alpha_soft_zipf": 1.0,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
13
  "batch_size": 64,
 
14
  "num_epochs": 10,
15
- "dataset_size": 50000,
16
- "lr": 8e-05,
 
 
 
17
  "output_dir": "ckpt/sweep/as_sorl_abs50_K4_50K",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
18
  "device": "cuda",
19
  "push_to_hub": true,
20
  "no_wandb": false,
21
  "n_params": 162540062,
22
  "run_name": "add_sub_sorl_v1_abs50_50K",
23
- "git_commit": "800625019270114adcda289bbd550c4f1109a514",
24
- "timestamp": "2026-04-12T03:52:52.696357+00:00",
25
  "tokenizer": "Qwen/Qwen3-0.6B",
26
  "dataset_repo": "thoughtworks/arithmetic-sorl-data",
27
  "dataset_config": "add_sub_6digit",
28
  "model_repo": "thoughtworks/arithmetic-sorl",
29
  "trainer_version": "v1",
30
- "wandb_run_id": "d8644t69",
31
- "wandb_url": "https://wandb.ai/nlp_and_interpretability/sorl-arithmetic/runs/d8644t69",
32
- "final_accuracy": 1.0,
33
- "sft_accuracy": 0.5107142857142857,
34
  "eval_method": "ArithmeticEvaluator"
35
  }
 
1
  {
2
+ "num_rollouts": 4,
 
 
 
 
 
 
3
  "K": 4,
4
+ "max_iterations": 2,
5
+ "memory_span_abs": 1792,
6
+ "memory_span_traj": 1792,
7
+ "temperature": 1.0,
8
+ "ar_search": false,
9
+ "response_only_abs": false,
10
  "alpha_info_gain": 10.0,
11
  "alpha_abs": 0.1,
12
  "alpha_soft_zipf": 1.0,
13
+ "alpha_ortho": 0.0,
14
+ "alpha_anchor": 0.0,
15
+ "alpha_jacobi": 0.0,
16
+ "decay": 0.8,
17
+ "target_vocab_util": 0.8,
18
+ "min_abs_ppl": 0.0,
19
+ "zipf_alpha": 1.0,
20
+ "lr": 4e-05,
21
+ "emb_lr_mult": 1.0,
22
+ "weight_decay": 0.01,
23
+ "warmup_steps": 234,
24
+ "cooldown_frac": 0.4,
25
+ "max_grad_norm": 1.0,
26
+ "vq_abs_pretrain_steps": 0,
27
+ "vq_abs_pretrain_lr": 0.001,
28
+ "vq_abs_pretrain_layer": -1,
29
+ "vq_abs_pretrain_batch_size": 256,
30
+ "vq_abs_pretrain_target_vectors": 20000,
31
  "batch_size": 64,
32
+ "gradient_accumulation_steps": 1,
33
  "num_epochs": 10,
34
+ "emb_warmup_steps": 0,
35
+ "log_every": 50,
36
+ "eval_every": 781,
37
+ "save_every": 999999,
38
+ "eval_samples": 100,
39
  "output_dir": "ckpt/sweep/as_sorl_abs50_K4_50K",
40
+ "eval_K": 4,
41
+ "alpha_traj": 0.0,
42
+ "corrupt_method": "shuffle",
43
+ "corrupt_ratio": 0.3,
44
+ "alpha_contrastive": 1.0,
45
+ "gamma_contrastive": 0.5,
46
+ "alpha_masked_traj": 0.0,
47
+ "mask_nl_ratio": 0.3,
48
+ "mask_nl_mode": "fixed",
49
+ "mask_nl_fixed_id": 0,
50
+ "use_ste": true,
51
+ "n_inner": 1,
52
+ "random_K": null,
53
+ "strip_suffix": null,
54
+ "compress_prefix": null,
55
+ "random_mem_span": null,
56
+ "warmup_ratio": 0.03,
57
+ "beta2": 0.999,
58
+ "seed": 42,
59
+ "n_digits": 6,
60
+ "n_layer": 2,
61
+ "n_head": 3,
62
+ "n_embd": 510,
63
+ "ops": "add_sub",
64
+ "abs_vocab": 50,
65
+ "dataset_size": 50000,
66
+ "mode": "sorl",
67
  "device": "cuda",
68
  "push_to_hub": true,
69
  "no_wandb": false,
70
  "n_params": 162540062,
71
  "run_name": "add_sub_sorl_v1_abs50_50K",
72
+ "git_commit": "f447da529caceac8c7d256cbb2cd185cbc50feac",
73
+ "timestamp": "2026-04-12T12:20:29.793903+00:00",
74
  "tokenizer": "Qwen/Qwen3-0.6B",
75
  "dataset_repo": "thoughtworks/arithmetic-sorl-data",
76
  "dataset_config": "add_sub_6digit",
77
  "model_repo": "thoughtworks/arithmetic-sorl",
78
  "trainer_version": "v1",
79
+ "wandb_run_id": "wtwip5r3",
80
+ "wandb_url": "https://wandb.ai/nlp_and_interpretability/sorl-arithmetic/runs/wtwip5r3",
81
+ "final_accuracy": 0.9983333333333333,
82
+ "sft_accuracy": 0.7658333333333334,
83
  "eval_method": "ArithmeticEvaluator"
84
  }