Timing1 commited on
Commit
6b1fcc5
·
verified ·
1 Parent(s): b9da35a

Upload folder using huggingface_hub

Browse files
Mambar/Base/checkpoint.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:171c72acc28ece4ba754497eb654a03065ab1cfb10d62ed9bb776791c8ff17ae
3
+ size 1792601134
Mambar/Base/checkpoint.pth.tar ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d888a50874a47176e13d84a69ef924d94a8ce06bdb8abb2209ed0a2f986642a4
3
+ size 49162696
Mambar/Base/config.txt ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ arch: mambar_base_patch16_224
2
+ batch_size_per_gpu: 64
3
+ clip_grad: 3.0
4
+ drop_path_rate: 0.1
5
+ epochs: 400
6
+ freeze_last_layer: 3
7
+ global_crops_scale: (0.25, 1.0)
8
+ gpu: 0
9
+ local_crops_number: 10
10
+ local_crops_scale: (0.05, 0.25)
11
+ local_rank: 0
12
+ lr: 0.00075
13
+ min_lr: 1e-06
14
+ momentum_teacher: 0.996
15
+ ngpus: 8
16
+ nodes: 2
17
+ norm_last_layer: True
18
+ num_workers: 10
19
+ optimizer: adamw
20
+ out_dim: 65536
21
+ patch_size: 16
22
+ rank: 0
23
+ saveckp_freq: 5
24
+ seed: 0
25
+ teacher_temp: 0.07
26
+ use_bn_in_head: False
27
+ use_fp16: True
28
+ use_volta32: False
29
+ warmup_epochs: 10
30
+ warmup_teacher_temp: 0.04
31
+ warmup_teacher_temp_epochs: 50
32
+ weight_decay: 0.04
33
+ weight_decay_end: 0.4
34
+ world_size: 16
Mambar/Base/log.txt ADDED
@@ -0,0 +1,387 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"train_loss": 8.637784875053867, "train_lr": 0.00014989207770405304, "train_wd": 0.04000184832683435, "epoch": 0}
2
+ {"train_loss": 5.633095048338198, "train_lr": 0.00044991606043648564, "train_wd": 0.04001294702294759, "epoch": 1}
3
+ {"train_loss": 5.1310941615193295, "train_lr": 0.000749940043168918, "train_wd": 0.04003514816830319, "epoch": 2}
4
+ {"train_loss": 8.087960571080423, "train_lr": 0.001049964025901351, "train_wd": 0.04006845039342992, "epoch": 3}
5
+ {"train_loss": 7.621806983253081, "train_lr": 0.001349988008633784, "train_wd": 0.04011285164408964, "epoch": 4}
6
+ {"train_loss": 6.403789825957837, "train_lr": 0.0016500119913662157, "train_wd": 0.04016834918140408, "epoch": 5}
7
+ {"train_loss": 5.733834925791819, "train_lr": 0.001950035974098649, "train_wd": 0.04023493958202372, "epoch": 6}
8
+ {"train_loss": 5.347950938722784, "train_lr": 0.0022500599568310814, "train_wd": 0.04031261873833893, "epoch": 7}
9
+ {"train_loss": 5.066360017450021, "train_lr": 0.0025500839395635145, "train_wd": 0.04040138185873359, "epoch": 8}
10
+ {"train_loss": 4.852225210550401, "train_lr": 0.002850107922295947, "train_wd": 0.04050122346788015, "epoch": 9}
11
+ {"train_loss": 4.67671491679766, "train_lr": 0.0029999838026699118, "train_wd": 0.04061213740707801, "epoch": 10}
12
+ {"train_loss": 4.53175099484688, "train_lr": 0.0029998865422038545, "train_wd": 0.04073411683463282, "epoch": 11}
13
+ {"train_loss": 4.417875208752713, "train_lr": 0.0029996919886937762, "train_wd": 0.040867154226278964, "epoch": 12}
14
+ {"train_loss": 4.324831972793519, "train_lr": 0.002999400154763969, "train_wd": 0.04101124137564353, "epoch": 13}
15
+ {"train_loss": 4.246375900664204, "train_lr": 0.0029990110593511414, "train_wd": 0.04116636939475232, "epoch": 14}
16
+ {"train_loss": 4.178796030503573, "train_lr": 0.0029985247277031202, "train_wd": 0.041332528714578515, "epoch": 15}
17
+ {"train_loss": 4.123293259518324, "train_lr": 0.0029979411913772626, "train_wd": 0.041509709085632535, "epoch": 16}
18
+ {"train_loss": 4.077983520883355, "train_lr": 0.0029972604882384166, "train_wd": 0.0416978995785944, "epoch": 17}
19
+ {"train_loss": 4.0401673916694545, "train_lr": 0.0029964826624564334, "train_wd": 0.041897088584988224, "epoch": 18}
20
+ {"train_loss": 4.010562509560375, "train_lr": 0.0029956077645033044, "train_wd": 0.04210726381789775, "epoch": 19}
21
+ {"train_loss": 3.9854510493106026, "train_lr": 0.0029946358511499164, "train_wd": 0.04232841231272449, "epoch": 20}
22
+ {"train_loss": 3.9652036193558735, "train_lr": 0.0029935669854623237, "train_wd": 0.042560520427987726, "epoch": 21}
23
+ {"train_loss": 3.947601104132849, "train_lr": 0.0029924012367976856, "train_wd": 0.042803573846165656, "epoch": 22}
24
+ {"train_loss": 3.9351046444605484, "train_lr": 0.0029911386807997807, "train_wd": 0.04305755757457835, "epoch": 23}
25
+ {"train_loss": 3.925088925827607, "train_lr": 0.00298977939939404, "train_wd": 0.04332245594631305, "epoch": 24}
26
+ {"train_loss": 3.9190836058651133, "train_lr": 0.0029883234807822987, "train_wd": 0.04359825262119076, "epoch": 25}
27
+ {"train_loss": 3.9176339993802762, "train_lr": 0.002986771019437023, "train_wd": 0.04388493058677311, "epoch": 26}
28
+ {"train_loss": 3.9152982651496484, "train_lr": 0.0029851221160952053, "train_wd": 0.044182472159412886, "epoch": 27}
29
+ {"train_loss": 3.916531576693868, "train_lr": 0.002983376877751814, "train_wd": 0.044490858985344404, "epoch": 28}
30
+ {"train_loss": 3.9185572913367683, "train_lr": 0.002981535417652882, "train_wd": 0.04481007204181546, "epoch": 29}
31
+ {"train_loss": 3.921876306644828, "train_lr": 0.002979597855288096, "train_wd": 0.045140091638261395, "epoch": 30}
32
+ {"train_loss": 3.9271574714343895, "train_lr": 0.002977564316383113, "train_wd": 0.04548089741751869, "epoch": 31}
33
+ {"train_loss": 3.9333651100012132, "train_lr": 0.0029754349328913556, "train_wd": 0.04583246835708167, "epoch": 32}
34
+ {"train_loss": 3.9402804658900825, "train_lr": 0.0029732098429854628, "train_wd": 0.04619478277039875, "epoch": 33}
35
+ {"train_loss": 3.952116961673581, "train_lr": 0.002970889191048336, "train_wd": 0.046567818308210114, "epoch": 34}
36
+ {"train_loss": 3.9622889224835913, "train_lr": 0.0029684731276637577, "train_wd": 0.046951551959926875, "epoch": 35}
37
+ {"train_loss": 3.9757145243249448, "train_lr": 0.0029659618096066057, "train_wd": 0.047345960055049645, "epoch": 36}
38
+ {"train_loss": 3.992285524388488, "train_lr": 0.0029633553998327203, "train_wd": 0.04775101826462935, "epoch": 37}
39
+ {"train_loss": 4.008188971226736, "train_lr": 0.0029606540674682893, "train_wd": 0.04816670160276764, "epoch": 38}
40
+ {"train_loss": 4.0273222257074215, "train_lr": 0.0029578579877989133, "train_wd": 0.048592984428158265, "epoch": 39}
41
+ {"train_loss": 4.047625695308335, "train_lr": 0.0029549673422581807, "train_wd": 0.04902984044566845, "epoch": 40}
42
+ {"train_loss": 4.072469926769022, "train_lr": 0.0029519823184159335, "train_wd": 0.04947724270796125, "epoch": 41}
43
+ {"train_loss": 4.096820257109799, "train_lr": 0.0029489031099660993, "train_wd": 0.04993516361715776, "epoch": 42}
44
+ {"train_loss": 4.123322501468906, "train_lr": 0.002945729916714115, "train_wd": 0.05040357492653923, "epoch": 43}
45
+ {"train_loss": 4.157062203597298, "train_lr": 0.0029424629445639165, "train_wd": 0.05088244774228973, "epoch": 44}
46
+ {"train_loss": 4.206582628136916, "train_lr": 0.0029391024055046705, "train_wd": 0.051371752525278355, "epoch": 45}
47
+ {"train_loss": 4.317350512642941, "train_lr": 0.0029356485175969184, "train_wd": 0.05187145909288109, "epoch": 46}
48
+ {"train_loss": 4.448395016334421, "train_lr": 0.002932101504958509, "train_wd": 0.05238153662084317, "epoch": 47}
49
+ {"train_loss": 4.556043886356979, "train_lr": 0.002928461597750018, "train_wd": 0.05290195364517991, "epoch": 48}
50
+ {"train_loss": 4.6499628172122796, "train_lr": 0.0029247290321597823, "train_wd": 0.05343267806411788, "epoch": 49}
51
+ {"train_loss": 4.6858804368977545, "train_lr": 0.0029209040503886527, "train_wd": 0.05397367714007509, "epoch": 50}
52
+ {"train_loss": 4.705584258400946, "train_lr": 0.002916986900634224, "train_wd": 0.05452491750168006, "epoch": 51}
53
+ {"train_loss": 4.714257818605784, "train_lr": 0.0029129778370747166, "train_wd": 0.05508636514583071, "epoch": 52}
54
+ {"train_loss": 4.7119163344089365, "train_lr": 0.0029088771198525114, "train_wd": 0.055657985439791856, "epoch": 53}
55
+ {"train_loss": 4.718173060152266, "train_lr": 0.002904685015057284, "train_wd": 0.05623974312333098, "epoch": 54}
56
+ {"train_loss": 4.715495297150741, "train_lr": 0.0029004017947086994, "train_wd": 0.05683160231089403, "epoch": 55}
57
+ {"train_loss": 4.71726435036968, "train_lr": 0.002896027736738807, "train_wd": 0.05743352649381821, "epoch": 56}
58
+ {"train_loss": 4.724034210165247, "train_lr": 0.0028915631249739407, "train_wd": 0.058045478542584836, "epoch": 57}
59
+ {"train_loss": 4.742459945303263, "train_lr": 0.002887008249116362, "train_wd": 0.058667420709108735, "epoch": 58}
60
+ {"train_loss": 4.768561949487403, "train_lr": 0.002882363404725456, "train_wd": 0.0592993146290676, "epoch": 59}
61
+ {"train_loss": 4.783723708143909, "train_lr": 0.0028776288931984854, "train_wd": 0.05994112132426791, "epoch": 60}
62
+ {"train_loss": 4.799492413822791, "train_lr": 0.002872805021751146, "train_wd": 0.06059280120504976, "epoch": 61}
63
+ {"train_loss": 4.809117233450655, "train_lr": 0.002867892103397529, "train_wd": 0.06125431407272825, "epoch": 62}
64
+ {"train_loss": 4.827439773080351, "train_lr": 0.0028628904569298827, "train_wd": 0.061925619122073595, "epoch": 63}
65
+ {"train_loss": 4.8564669941064365, "train_lr": 0.002857800406897867, "train_wd": 0.06260667494382822, "epoch": 64}
66
+ {"train_loss": 4.884930635241868, "train_lr": 0.0028526222835875276, "train_wd": 0.06329743952726108, "epoch": 65}
67
+ {"train_loss": 4.896211382749079, "train_lr": 0.0028473564229998805, "train_wd": 0.06399787026275884, "epoch": 66}
68
+ {"train_loss": 4.898126037608233, "train_lr": 0.00284200316682906, "train_wd": 0.06470792394445458, "epoch": 67}
69
+ {"train_loss": 4.907707621201242, "train_lr": 0.0028365628624401965, "train_wd": 0.06542755677289244, "epoch": 68}
70
+ {"train_loss": 4.924035449655984, "train_lr": 0.002831035862846838, "train_wd": 0.06615672435772965, "epoch": 69}
71
+ {"train_loss": 4.937764649542211, "train_lr": 0.0028254225266880722, "train_wd": 0.0668953817204749, "epoch": 70}
72
+ {"train_loss": 4.937171941442932, "train_lr": 0.0028197232182052357, "train_wd": 0.06764348329726301, "epoch": 71}
73
+ {"train_loss": 4.937672174579615, "train_lr": 0.0028139383072182987, "train_wd": 0.06840098294166454, "epoch": 72}
74
+ {"train_loss": 4.937207261745116, "train_lr": 0.002808068169101827, "train_wd": 0.0691678339275332, "epoch": 73}
75
+ {"train_loss": 4.9412580392867635, "train_lr": 0.0028021131847606844, "train_wd": 0.06994398895188833, "epoch": 74}
76
+ {"train_loss": 4.965779498505364, "train_lr": 0.0027960737406052716, "train_wd": 0.07072940013783183, "epoch": 75}
77
+ {"train_loss": 4.936880992780582, "train_lr": 0.0027899502285264523, "train_wd": 0.07152401903750212, "epoch": 76}
78
+ {"train_loss": 4.940866274322919, "train_lr": 0.002783743045870157, "train_wd": 0.07232779663506239, "epoch": 77}
79
+ {"train_loss": 4.943100978597272, "train_lr": 0.002777452595411585, "train_wd": 0.07314068334972461, "epoch": 78}
80
+ {"train_loss": 4.948584020471306, "train_lr": 0.002771079285329034, "train_wd": 0.07396262903880665, "epoch": 79}
81
+ {"train_loss": 4.951009390641936, "train_lr": 0.0027646235291774726, "train_wd": 0.07479358300082734, "epoch": 80}
82
+ {"train_loss": 4.954907455175615, "train_lr": 0.00275808574586166, "train_wd": 0.07563349397863156, "epoch": 81}
83
+ {"train_loss": 4.959115107473043, "train_lr": 0.002751466359608986, "train_wd": 0.07648231016255437, "epoch": 82}
84
+ {"train_loss": 4.963199247368615, "train_lr": 0.002744765799941942, "train_wd": 0.07733997919361478, "epoch": 83}
85
+ {"train_loss": 4.964840286558004, "train_lr": 0.002737984501650248, "train_wd": 0.07820644816674745, "epoch": 84}
86
+ {"train_loss": 4.968151657653751, "train_lr": 0.0027311229047626224, "train_wd": 0.07908166363406441, "epoch": 85}
87
+ {"train_loss": 4.974305803112561, "train_lr": 0.002724181454518261, "train_wd": 0.0799655716081529, "epoch": 86}
88
+ {"train_loss": 4.977017305928359, "train_lr": 0.002717160601337916, "train_wd": 0.08085811756540572, "epoch": 87}
89
+ {"train_loss": 4.983094227090061, "train_lr": 0.0027100608007946964, "train_wd": 0.08175924644938394, "epoch": 88}
90
+ {"train_loss": 4.9874478117358105, "train_lr": 0.0027028825135844755, "train_wd": 0.08266890267421322, "epoch": 89}
91
+ {"train_loss": 4.987364651988164, "train_lr": 0.002695626205496035, "train_wd": 0.08358703012801295, "epoch": 90}
92
+ {"train_loss": 4.990436220912339, "train_lr": 0.0026882923473808013, "train_wd": 0.08451357217635665, "epoch": 91}
93
+ {"train_loss": 4.995171819421218, "train_lr": 0.0026808814151223124, "train_wd": 0.08544847166576668, "epoch": 92}
94
+ {"train_loss": 4.997217367950389, "train_lr": 0.0026733938896053608, "train_wd": 0.08639167092723855, "epoch": 93}
95
+ {"train_loss": 5.038740194672875, "train_lr": 0.0026658302566847265, "train_wd": 0.08734311177979903, "epoch": 94}
96
+ {"train_loss": 5.014156195781023, "train_lr": 0.002658191007153721, "train_wd": 0.08830273553409476, "epoch": 95}
97
+ {"train_loss": 5.009222702680827, "train_lr": 0.0026504766367122933, "train_wd": 0.08927048299601234, "epoch": 96}
98
+ {"train_loss": 5.012783599080895, "train_lr": 0.0026426876459349014, "train_wd": 0.0902462944703294, "epoch": 97}
99
+ {"train_loss": 5.016705432002969, "train_lr": 0.0026348245402379733, "train_wd": 0.09123010976439835, "epoch": 98}
100
+ {"train_loss": 5.021137339462765, "train_lr": 0.002626887829847183, "train_wd": 0.09222186819185733, "epoch": 99}
101
+ {"train_loss": 5.022984991470973, "train_lr": 0.002618878029764289, "train_wd": 0.09322150857637478, "epoch": 100}
102
+ {"train_loss": 5.0258191209569345, "train_lr": 0.002610795659733746, "train_wd": 0.09422896925542353, "epoch": 101}
103
+ {"train_loss": 5.030008376764355, "train_lr": 0.002602641244208954, "train_wd": 0.0952441880840829, "epoch": 102}
104
+ {"train_loss": 5.034229690484482, "train_lr": 0.002594415312318255, "train_wd": 0.09626710243887358, "epoch": 103}
105
+ {"train_loss": 5.037663597140095, "train_lr": 0.0025861183978305854, "train_wd": 0.09729764922162, "epoch": 104}
106
+ {"train_loss": 5.038708233790432, "train_lr": 0.002577751039120829, "train_wd": 0.09833576486334186, "epoch": 105}
107
+ {"train_loss": 5.040633473846076, "train_lr": 0.0025693137791349087, "train_wd": 0.09938138532817689, "epoch": 106}
108
+ {"train_loss": 5.044556893033089, "train_lr": 0.0025608071653545257, "train_wd": 0.10043444611732918, "epoch": 107}
109
+ {"train_loss": 5.04665414549464, "train_lr": 0.002552231749761659, "train_wd": 0.10149488227304866, "epoch": 108}
110
+ {"train_loss": 5.050433608029577, "train_lr": 0.0025435880888027523, "train_wd": 0.10256262838263915, "epoch": 109}
111
+ {"train_loss": 5.052883165941346, "train_lr": 0.0025348767433525615, "train_wd": 0.10363761858248993, "epoch": 110}
112
+ {"train_loss": 5.05480886098864, "train_lr": 0.0025260982786778105, "train_wd": 0.10471978656214238, "epoch": 111}
113
+ {"train_loss": 5.058974848352938, "train_lr": 0.0025172532644004942, "train_wd": 0.10580906556837821, "epoch": 112}
114
+ {"train_loss": 5.062112297609651, "train_lr": 0.0025083422744609203, "train_wd": 0.1069053884093369, "epoch": 113}
115
+ {"train_loss": 5.0650221192293605, "train_lr": 0.0024993658870804485, "train_wd": 0.10800868745866157, "epoch": 114}
116
+ {"train_loss": 5.0681009875546446, "train_lr": 0.00249032468472399, "train_wd": 0.10911889465967017, "epoch": 115}
117
+ {"train_loss": 5.070849523793974, "train_lr": 0.002481219254062226, "train_wd": 0.11023594152955288, "epoch": 116}
118
+ {"train_loss": 5.07393309819422, "train_lr": 0.00247205018593348, "train_wd": 0.1113597591635967, "epoch": 117}
119
+ {"train_loss": 5.077277494539365, "train_lr": 0.0024628180753054627, "train_wd": 0.11249027823943662, "epoch": 118}
120
+ {"train_loss": 5.081458705196754, "train_lr": 0.0024535235212365916, "train_wd": 0.11362742902133077, "epoch": 119}
121
+ {"train_loss": 5.083277868948204, "train_lr": 0.002444167126837155, "train_wd": 0.11477114136446238, "epoch": 120}
122
+ {"train_loss": 5.088729355070326, "train_lr": 0.0024347494992301927, "train_wd": 0.11592134471926685, "epoch": 121}
123
+ {"train_loss": 5.090475154318493, "train_lr": 0.002425271249512061, "train_wd": 0.11707796813578324, "epoch": 122}
124
+ {"train_loss": 5.093144760953246, "train_lr": 0.0024157329927127964, "train_wd": 0.11824094026803104, "epoch": 123}
125
+ {"train_loss": 5.096025113555358, "train_lr": 0.0024061353477562043, "train_wd": 0.11941018937841129, "epoch": 124}
126
+ {"train_loss": 5.098238207024636, "train_lr": 0.0023964789374197383, "train_wd": 0.12058564334213075, "epoch": 125}
127
+ {"train_loss": 5.099690542756606, "train_lr": 0.0023867643882940033, "train_wd": 0.12176722965165207, "epoch": 126}
128
+ {"train_loss": 5.105195191457308, "train_lr": 0.0023769923307421724, "train_wd": 0.12295487542116657, "epoch": 127}
129
+ {"train_loss": 5.1075353466873645, "train_lr": 0.0023671633988590654, "train_wd": 0.12414850739108822, "epoch": 128}
130
+ {"train_loss": 5.1088118717300715, "train_lr": 0.0023572782304299884, "train_wd": 0.12534805193257537, "epoch": 129}
131
+ {"train_loss": 5.110424691252857, "train_lr": 0.002347337466889345, "train_wd": 0.1265534350520693, "epoch": 130}
132
+ {"train_loss": 5.111701018351922, "train_lr": 0.002337341753279037, "train_wd": 0.12776458239586194, "epoch": 131}
133
+ {"train_loss": 5.115474094542192, "train_lr": 0.00232729173820661, "train_wd": 0.12898141925467993, "epoch": 132}
134
+ {"train_loss": 5.119318662549285, "train_lr": 0.0023171880738031233, "train_wd": 0.13020387056829405, "epoch": 133}
135
+ {"train_loss": 5.121577044518636, "train_lr": 0.0023070314156808857, "train_wd": 0.131431860930149, "epoch": 134}
136
+ {"train_loss": 5.123207431855342, "train_lr": 0.0022968224228908933, "train_wd": 0.1326653145920152, "epoch": 135}
137
+ {"train_loss": 5.126235680328571, "train_lr": 0.0022865617578800516, "train_wd": 0.13390415546866058, "epoch": 136}
138
+ {"train_loss": 5.12730328156222, "train_lr": 0.0022762500864482115, "train_wd": 0.13514830714254386, "epoch": 137}
139
+ {"train_loss": 5.130745309172012, "train_lr": 0.0022658880777049546, "train_wd": 0.13639769286853004, "epoch": 138}
140
+ {"train_loss": 5.1327518000067185, "train_lr": 0.0022554764040261807, "train_wd": 0.1376522355786219, "epoch": 139}
141
+ {"train_loss": 5.134366833334632, "train_lr": 0.0022450157410104743, "train_wd": 0.13891185788671606, "epoch": 140}
142
+ {"train_loss": 5.1361980884195235, "train_lr": 0.002234506767435265, "train_wd": 0.14017648209337533, "epoch": 141}
143
+ {"train_loss": 5.13669639673355, "train_lr": 0.0022239501652127867, "train_wd": 0.1414460301906212, "epoch": 142}
144
+ {"train_loss": 5.139296575797071, "train_lr": 0.0022133466193458334, "train_wd": 0.14272042386674683, "epoch": 143}
145
+ {"train_loss": 5.1428935866561725, "train_lr": 0.0022026968178833033, "train_wd": 0.14399958451114783, "epoch": 144}
146
+ {"train_loss": 5.145059065019294, "train_lr": 0.002192001451875542, "train_wd": 0.14528343321917023, "epoch": 145}
147
+ {"train_loss": 5.145093682191545, "train_lr": 0.0021812612153295336, "train_wd": 0.14657189079697763, "epoch": 146}
148
+ {"train_loss": 5.147813194256416, "train_lr": 0.0021704768051638294, "train_wd": 0.14786487776643836, "epoch": 147}
149
+ {"train_loss": 5.149246137181251, "train_lr": 0.0021596489211633506, "train_wd": 0.14916231437002508, "epoch": 148}
150
+ {"train_loss": 5.151238352632065, "train_lr": 0.002148778265933976, "train_wd": 0.15046412057573721, "epoch": 149}
151
+ {"train_loss": 5.154652908194265, "train_lr": 0.0021378655448569487, "train_wd": 0.15177021608203492, "epoch": 150}
152
+ {"train_loss": 5.1537324655875505, "train_lr": 0.002126911466043091, "train_wd": 0.15308052032279595, "epoch": 151}
153
+ {"train_loss": 5.16021317141138, "train_lr": 0.002115916740286885, "train_wd": 0.1543949524722823, "epoch": 152}
154
+ {"train_loss": 5.157779362990702, "train_lr": 0.0021048820810203295, "train_wd": 0.15571343145012764, "epoch": 153}
155
+ {"train_loss": 5.157764540039759, "train_lr": 0.002093808204266648, "train_wd": 0.15703587592633758, "epoch": 154}
156
+ {"train_loss": 5.160089642262097, "train_lr": 0.002082695828593838, "train_wd": 0.15836220432630835, "epoch": 155}
157
+ {"train_loss": 5.161441784468201, "train_lr": 0.002071545675068029, "train_wd": 0.15969233483585576, "epoch": 156}
158
+ {"train_loss": 5.161002433986115, "train_lr": 0.0020603584672067065, "train_wd": 0.16102618540626526, "epoch": 157}
159
+ {"train_loss": 5.1620103516500535, "train_lr": 0.0020491349309317486, "train_wd": 0.16236367375935024, "epoch": 158}
160
+ {"train_loss": 5.164971074207033, "train_lr": 0.0020378757945223513, "train_wd": 0.16370471739252893, "epoch": 159}
161
+ {"train_loss": 5.164828603049453, "train_lr": 0.002026581788567735, "train_wd": 0.16504923358391366, "epoch": 160}
162
+ {"train_loss": 5.163869374733177, "train_lr": 0.002015253645919768, "train_wd": 0.16639713939741188, "epoch": 161}
163
+ {"train_loss": 5.164344825904718, "train_lr": 0.0020038921016453824, "train_wd": 0.1677483516878441, "epoch": 162}
164
+ {"train_loss": 5.164674375911982, "train_lr": 0.001992497892978911, "train_wd": 0.16910278710607163, "epoch": 163}
165
+ {"train_loss": 5.165384127820234, "train_lr": 0.0019810717592742295, "train_wd": 0.17046036210413787, "epoch": 164}
166
+ {"train_loss": 5.165045586111639, "train_lr": 0.001969614441956772, "train_wd": 0.1718209929404218, "epoch": 165}
167
+ {"train_loss": 5.168556304000836, "train_lr": 0.001958126684475442, "train_wd": 0.1731845956848044, "epoch": 166}
168
+ {"train_loss": 5.168179201446087, "train_lr": 0.0019466092322543667, "train_wd": 0.17455108622384533, "epoch": 167}
169
+ {"train_loss": 5.1679782578699305, "train_lr": 0.0019350628326445037, "train_wd": 0.1759203802659719, "epoch": 168}
170
+ {"train_loss": 5.166809007989989, "train_lr": 0.0019234882348751836, "train_wd": 0.1772923933466772, "epoch": 169}
171
+ {"train_loss": 5.168555745808817, "train_lr": 0.0019118861900054686, "train_wd": 0.17866704083373156, "epoch": 170}
172
+ {"train_loss": 5.170631839431447, "train_lr": 0.0019002574508754236, "train_wd": 0.18004423793240237, "epoch": 171}
173
+ {"train_loss": 5.1686469061816815, "train_lr": 0.0018886027720572674, "train_wd": 0.18142389969068656, "epoch": 172}
174
+ {"train_loss": 5.179082334994508, "train_lr": 0.0018769229098064056, "train_wd": 0.18280594100454756, "epoch": 173}
175
+ {"train_loss": 5.172065630305013, "train_lr": 0.001865218622012359, "train_wd": 0.18419027662316695, "epoch": 174}
176
+ {"train_loss": 5.172670949253438, "train_lr": 0.0018534906681495903, "train_wd": 0.18557682115420307, "epoch": 175}
177
+ {"train_loss": 5.172535467562344, "train_lr": 0.0018417398092282276, "train_wd": 0.18696548906905788, "epoch": 176}
178
+ {"train_loss": 5.170949884932295, "train_lr": 0.0018299668077446532, "train_wd": 0.18835619470815332, "epoch": 177}
179
+ {"train_loss": 5.170384844787401, "train_lr": 0.001818172427632073, "train_wd": 0.18974885228621524, "epoch": 178}
180
+ {"train_loss": 5.171376506701933, "train_lr": 0.0018063574342109087, "train_wd": 0.19114337589756344, "epoch": 179}
181
+ {"train_loss": 5.17260210000449, "train_lr": 0.0017945225941391409, "train_wd": 0.1925396795214132, "epoch": 180}
182
+ {"train_loss": 5.170950078849884, "train_lr": 0.0017826686753625938, "train_wd": 0.19393767702717982, "epoch": 181}
183
+ {"train_loss": 5.171539771137573, "train_lr": 0.001770796447065067, "train_wd": 0.19533728217979157, "epoch": 182}
184
+ {"train_loss": 5.171516598200054, "train_lr": 0.0017589066796184377, "train_wd": 0.19673840864500997, "epoch": 183}
185
+ {"train_loss": 5.171016397545759, "train_lr": 0.0017470001445326817, "train_wd": 0.19814096999475622, "epoch": 184}
186
+ {"train_loss": 5.16912194038276, "train_lr": 0.0017350776144057975, "train_wd": 0.19954487971243742, "epoch": 185}
187
+ {"train_loss": 5.166941123281261, "train_lr": 0.0017231398628736743, "train_wd": 0.2009500511982903, "epoch": 186}
188
+ {"train_loss": 5.169427223581014, "train_lr": 0.0017111876645599085, "train_wd": 0.20235639777471853, "epoch": 187}
189
+ {"train_loss": 5.091156020415106, "train_lr": 0.0008498265702808308, "train_wd": 0.2037641140566197, "epoch": 188}
190
+ {"train_loss": 5.074340996815622, "train_lr": 0.0008438391840046157, "train_wd": 0.2051725506882831, "epoch": 189}
191
+ {"train_loss": 5.097286776196566, "train_lr": 0.0008378457410825078, "train_wd": 0.20658190194686343, "epoch": 190}
192
+ {"train_loss": 5.1169881571254, "train_lr": 0.0008318466304204374, "train_wd": 0.2079920808969362, "epoch": 191}
193
+ {"train_loss": 5.133275799709353, "train_lr": 0.0008258422412920895, "train_wd": 0.20940300055202227, "epoch": 192}
194
+ {"train_loss": 5.143341844292472, "train_lr": 0.0008198329633136755, "train_wd": 0.2108145738799509, "epoch": 193}
195
+ {"train_loss": 5.1502472004778, "train_lr": 0.0008138191864186288, "train_wd": 0.2122267138082284, "epoch": 194}
196
+ {"train_loss": 5.153045735032343, "train_lr": 0.0008078013008323177, "train_wd": 0.2136393332294141, "epoch": 195}
197
+ {"train_loss": 5.156373023105373, "train_lr": 0.000801779697046708, "train_wd": 0.21505234500648884, "epoch": 196}
198
+ {"train_loss": 5.158538863265353, "train_lr": 0.0007957547657950476, "train_wd": 0.21646566197822822, "epoch": 197}
199
+ {"train_loss": 5.159798114896297, "train_lr": 0.0007897268980264856, "train_wd": 0.21787919696458521, "epoch": 198}
200
+ {"train_loss": 5.15958246436241, "train_lr": 0.0007836964848807235, "train_wd": 0.21929286277206284, "epoch": 199}
201
+ {"train_loss": 5.158015418514836, "train_lr": 0.0007776639176626316, "train_wd": 0.2207065721990966, "epoch": 200}
202
+ {"train_loss": 5.157515886495058, "train_lr": 0.0007716295878168495, "train_wd": 0.22212023804142747, "epoch": 201}
203
+ {"train_loss": 5.158735573887348, "train_lr": 0.0007655938869023945, "train_wd": 0.22353377309748948, "epoch": 202}
204
+ {"train_loss": 5.159842118442201, "train_lr": 0.0007595572065672457, "train_wd": 0.22494709017378173, "epoch": 203}
205
+ {"train_loss": 5.157648079948936, "train_lr": 0.0007535199385229474, "train_wd": 0.226360102090248, "epoch": 204}
206
+ {"train_loss": 5.155930278803424, "train_lr": 0.0007474824745191613, "train_wd": 0.22777272168565932, "epoch": 205}
207
+ {"train_loss": 5.156330907802216, "train_lr": 0.0007414452063182832, "train_wd": 0.22918486182298461, "epoch": 206}
208
+ {"train_loss": 5.152855788155806, "train_lr": 0.0007354085256699883, "train_wd": 0.23059643539476835, "epoch": 207}
209
+ {"train_loss": 5.151917979204588, "train_lr": 0.0007293728242858365, "train_wd": 0.2320073553285019, "epoch": 208}
210
+ {"train_loss": 5.150041867741387, "train_lr": 0.0007233384938138418, "train_wd": 0.23341753459200015, "epoch": 209}
211
+ {"train_loss": 5.148483486889268, "train_lr": 0.0007173059258130587, "train_wd": 0.2348268861987621, "epoch": 210}
212
+ {"train_loss": 5.147640997485863, "train_lr": 0.0007112755117281798, "train_wd": 0.23623532321334312, "epoch": 211}
213
+ {"train_loss": 5.146305283839754, "train_lr": 0.0007052476428641331, "train_wd": 0.2376427587567114, "epoch": 212}
214
+ {"train_loss": 5.144308296991862, "train_lr": 0.0006992227103606954, "train_wd": 0.23904910601161666, "epoch": 213}
215
+ {"train_loss": 5.14037477448404, "train_lr": 0.0006932011051670964, "train_wd": 0.24045427822793347, "epoch": 214}
216
+ {"train_loss": 5.138576725451685, "train_lr": 0.0006871832180166713, "train_wd": 0.24185818872801984, "epoch": 215}
217
+ {"train_loss": 5.137665674149942, "train_lr": 0.0006811694394014925, "train_wd": 0.243260750912065, "epoch": 216}
218
+ {"train_loss": 5.1363301173769695, "train_lr": 0.0006751601595470362, "train_wd": 0.2446618782634265, "epoch": 217}
219
+ {"train_loss": 5.133028356601104, "train_lr": 0.0006691557683868604, "train_wd": 0.24606148435396777, "epoch": 218}
220
+ {"train_loss": 5.130677510603822, "train_lr": 0.0006631566555373037, "train_wd": 0.2474594828493942, "epoch": 219}
221
+ {"train_loss": 5.127656989984756, "train_lr": 0.0006571632102722034, "train_wd": 0.24885578751457296, "epoch": 220}
222
+ {"train_loss": 5.1263827938113, "train_lr": 0.0006511758214976268, "train_wd": 0.2502503122188545, "epoch": 221}
223
+ {"train_loss": 5.12371546544617, "train_lr": 0.0006451948777266588, "train_wd": 0.2516429709413868, "epoch": 222}
224
+ {"train_loss": 5.120851164217666, "train_lr": 0.0006392207670541658, "train_wd": 0.2530336777764206, "epoch": 223}
225
+ {"train_loss": 5.1169206816658415, "train_lr": 0.0006332538771316324, "train_wd": 0.2544223469386053, "epoch": 224}
226
+ {"train_loss": 5.115419379860568, "train_lr": 0.000627294595141991, "train_wd": 0.2558088927682875, "epoch": 225}
227
+ {"train_loss": 5.1108370521705115, "train_lr": 0.0006213433077745081, "train_wd": 0.2571932297367883, "epoch": 226}
228
+ {"train_loss": 5.10864352238931, "train_lr": 0.0006154004011996976, "train_wd": 0.25857527245168443, "epoch": 227}
229
+ {"train_loss": 5.107386470245991, "train_lr": 0.0006094662610442453, "train_wd": 0.25995493566206923, "epoch": 228}
230
+ {"train_loss": 5.1053868394246775, "train_lr": 0.0006035412723660057, "train_wd": 0.26133213426381785, "epoch": 229}
231
+ {"train_loss": 5.1019349890075425, "train_lr": 0.0005976258196290032, "train_wd": 0.2627067833048336, "epoch": 230}
232
+ {"train_loss": 5.100072723450801, "train_lr": 0.0005917202866784867, "train_wd": 0.26407879799028827, "epoch": 231}
233
+ {"train_loss": 5.095352543153161, "train_lr": 0.0005858250567160279, "train_wd": 0.26544809368785205, "epoch": 232}
234
+ {"train_loss": 5.092102071959719, "train_lr": 0.0005799405122746496, "train_wd": 0.266814585932919, "epoch": 233}
235
+ {"train_loss": 5.08918897908845, "train_lr": 0.0005740670351940112, "train_wd": 0.26817819043380836, "epoch": 234}
236
+ {"train_loss": 5.085278718329543, "train_lr": 0.0005682050065956177, "train_wd": 0.26953882307697197, "epoch": 235}
237
+ {"train_loss": 5.082459406219988, "train_lr": 0.0005623548068581079, "train_wd": 0.27089639993218084, "epoch": 236}
238
+ {"train_loss": 5.079539365167145, "train_lr": 0.0005565168155925589, "train_wd": 0.27225083725769716, "epoch": 237}
239
+ {"train_loss": 5.074885640022376, "train_lr": 0.0005506914116178581, "train_wd": 0.2736020515054495, "epoch": 238}
240
+ {"train_loss": 5.070625886023283, "train_lr": 0.0005448789729361201, "train_wd": 0.2749499593261752, "epoch": 239}
241
+ {"train_loss": 5.067727992908179, "train_lr": 0.0005390798767081622, "train_wd": 0.2762944775745731, "epoch": 240}
242
+ {"train_loss": 5.065570102321158, "train_lr": 0.000533294499229026, "train_wd": 0.2776355233144227, "epoch": 241}
243
+ {"train_loss": 5.061097588661096, "train_lr": 0.0005275232159035702, "train_wd": 0.27897301382370754, "epoch": 242}
244
+ {"train_loss": 5.057949278518546, "train_lr": 0.000521766401222094, "train_wd": 0.2803068665997115, "epoch": 243}
245
+ {"train_loss": 5.054585099053516, "train_lr": 0.0005160244287360554, "train_wd": 0.28163699936411407, "epoch": 244}
246
+ {"train_loss": 5.050628634856092, "train_lr": 0.0005102976710338187, "train_wd": 0.28296333006805835, "epoch": 245}
247
+ {"train_loss": 5.046271638761607, "train_lr": 0.0005045864997164855, "train_wd": 0.2842857768972205, "epoch": 246}
248
+ {"train_loss": 5.041309315285427, "train_lr": 0.000498891285373778, "train_wd": 0.28560425827685115, "epoch": 247}
249
+ {"train_loss": 5.039088412488012, "train_lr": 0.000493212397559995, "train_wd": 0.28691869287680605, "epoch": 248}
250
+ {"train_loss": 5.034920222157959, "train_lr": 0.0004875502047700239, "train_wd": 0.28822899961657056, "epoch": 249}
251
+ {"train_loss": 5.031195666340234, "train_lr": 0.00048190507441544584, "train_wd": 0.28953509767025165, "epoch": 250}
252
+ {"train_loss": 5.0278924695974725, "train_lr": 0.00047627737280067536, "train_wd": 0.29083690647156873, "epoch": 251}
253
+ {"train_loss": 5.022235716418397, "train_lr": 0.0004706674650992103, "train_wd": 0.2921343457188231, "epoch": 252}
254
+ {"train_loss": 5.019888596926376, "train_lr": 0.0004650757153299159, "train_wd": 0.293427335379849, "epoch": 253}
255
+ {"train_loss": 5.015133864897713, "train_lr": 0.00045950248633342745, "train_wd": 0.29471579569695666, "epoch": 254}
256
+ {"train_loss": 5.0107867040460725, "train_lr": 0.0004539481397485846, "train_wd": 0.2959996471918429, "epoch": 255}
257
+ {"train_loss": 5.005873859881593, "train_lr": 0.00044841303598897823, "train_wd": 0.2972788106704991, "epoch": 256}
258
+ {"train_loss": 5.001143803842348, "train_lr": 0.0004428975342195577, "train_wd": 0.2985532072280974, "epoch": 257}
259
+ {"train_loss": 4.993955240642234, "train_lr": 0.0004374019923333321, "train_wd": 0.29982275825385585, "epoch": 258}
260
+ {"train_loss": 4.990069762193899, "train_lr": 0.00043192676692813543, "train_wd": 0.30108738543588637, "epoch": 259}
261
+ {"train_loss": 4.983701609354988, "train_lr": 0.0004264722132834999, "train_wd": 0.3023470107660269, "epoch": 260}
262
+ {"train_loss": 4.979862540555325, "train_lr": 0.00042103868533759526, "train_wd": 0.30360155654465537, "epoch": 261}
263
+ {"train_loss": 4.974370903438992, "train_lr": 0.0004156265356642622, "train_wd": 0.30485094538547675, "epoch": 262}
264
+ {"train_loss": 4.969085089022593, "train_lr": 0.0004102361154501367, "train_wd": 0.30609510022030406, "epoch": 263}
265
+ {"train_loss": 4.964561837468501, "train_lr": 0.000404867774471865, "train_wd": 0.3073339443038037, "epoch": 264}
266
+ {"train_loss": 4.959437264646176, "train_lr": 0.0003995218610733946, "train_wd": 0.3085674012182414, "epoch": 265}
267
+ {"train_loss": 4.95331798475995, "train_lr": 0.000394198722143389, "train_wd": 0.30979539487818164, "epoch": 266}
268
+ {"train_loss": 4.948438049649163, "train_lr": 0.00038889870309270395, "train_wd": 0.31101784953519124, "epoch": 267}
269
+ {"train_loss": 4.943596207361808, "train_lr": 0.0003836221478319808, "train_wd": 0.31223468978250896, "epoch": 268}
270
+ {"train_loss": 4.937840783624626, "train_lr": 0.0003783693987493274, "train_wd": 0.31344584055969793, "epoch": 269}
271
+ {"train_loss": 4.932893885506524, "train_lr": 0.0003731407966881066, "train_wd": 0.3146512271572712, "epoch": 270}
272
+ {"train_loss": 4.928088319554127, "train_lr": 0.00036793668092481097, "train_wd": 0.31585077522130556, "epoch": 271}
273
+ {"train_loss": 4.92392223392078, "train_lr": 0.00036275738914705503, "train_wd": 0.31704441075802686, "epoch": 272}
274
+ {"train_loss": 4.916985667342667, "train_lr": 0.0003576032574316618, "train_wd": 0.31823206013837346, "epoch": 273}
275
+ {"train_loss": 4.911200050755943, "train_lr": 0.00035247462022285054, "train_wd": 0.3194136501025365, "epoch": 274}
276
+ {"train_loss": 4.905656064299943, "train_lr": 0.0003473718103105396, "train_wd": 0.32058910776448063, "epoch": 275}
277
+ {"train_loss": 4.89873350981614, "train_lr": 0.0003422951588087524, "train_wd": 0.3217583606164405, "epoch": 276}
278
+ {"train_loss": 4.893262678913647, "train_lr": 0.00033724499513413184, "train_wd": 0.32292133653339306, "epoch": 277}
279
+ {"train_loss": 4.887584132160977, "train_lr": 0.00033222164698455746, "train_wd": 0.3240779637775073, "epoch": 278}
280
+ {"train_loss": 4.881265171068749, "train_lr": 0.00032722544031789385, "train_wd": 0.32522817100256185, "epoch": 279}
281
+ {"train_loss": 4.875934096572878, "train_lr": 0.00032225669933083243, "train_wd": 0.32637188725836164, "epoch": 280}
282
+ {"train_loss": 4.868471115922851, "train_lr": 0.00031731574643785644, "train_wd": 0.3275090419950986, "epoch": 281}
283
+ {"train_loss": 4.8624490595740575, "train_lr": 0.0003124029022503148, "train_wd": 0.3286395650677133, "epoch": 282}
284
+ {"train_loss": 4.855783086445787, "train_lr": 0.00030751848555562983, "train_wd": 0.3297633867402155, "epoch": 283}
285
+ {"train_loss": 4.85036742828971, "train_lr": 0.0003026628132965996, "train_wd": 0.3308804376899928, "epoch": 284}
286
+ {"train_loss": 4.843636494686754, "train_lr": 0.0002978362005508379, "train_wd": 0.33199064901207925, "epoch": 285}
287
+ {"train_loss": 4.836789924011146, "train_lr": 0.00029303896051033107, "train_wd": 0.33309395222341115, "epoch": 286}
288
+ {"train_loss": 4.830869138228903, "train_lr": 0.00028827140446110924, "train_wd": 0.3341902792670508, "epoch": 287}
289
+ {"train_loss": 4.823843292778821, "train_lr": 0.00028353384176305264, "train_wd": 0.33527956251638, "epoch": 288}
290
+ {"train_loss": 4.816310359205273, "train_lr": 0.0002788265798298155, "train_wd": 0.3363617347792796, "epoch": 289}
291
+ {"train_loss": 4.811116400418236, "train_lr": 0.0002741499241088787, "train_wd": 0.3374367293022637, "epoch": 290}
292
+ {"train_loss": 4.8042942608693995, "train_lr": 0.00026950417806172997, "train_wd": 0.33850447977460785, "epoch": 291}
293
+ {"train_loss": 4.797446650805043, "train_lr": 0.00026488964314417304, "train_wd": 0.3395649203324349, "epoch": 292}
294
+ {"train_loss": 4.789914706080175, "train_lr": 0.00026030661878676556, "train_wd": 0.34061798556277467, "epoch": 293}
295
+ {"train_loss": 4.782356360035358, "train_lr": 0.00025575540237539123, "train_wd": 0.3416636105076024, "epoch": 294}
296
+ {"train_loss": 4.776044220137272, "train_lr": 0.0002512362892319595, "train_wd": 0.34270173066784837, "epoch": 295}
297
+ {"train_loss": 4.769099719149413, "train_lr": 0.0002467495725952468, "train_wd": 0.34373228200736883, "epoch": 296}
298
+ {"train_loss": 4.759538625677426, "train_lr": 0.00024229554360186628, "train_wd": 0.3447552009569052, "epoch": 297}
299
+ {"train_loss": 4.752294977386888, "train_lr": 0.0002378744912673752, "train_wd": 0.3457704244179973, "epoch": 298}
300
+ {"train_loss": 4.74378167670503, "train_lr": 0.00023348670246752583, "train_wd": 0.3467778897668786, "epoch": 299}
301
+ {"train_loss": 4.738346022786759, "train_lr": 0.00022913246191964378, "train_wd": 0.3477775348583425, "epoch": 300}
302
+ {"train_loss": 4.730807079649944, "train_lr": 0.00022481205216415992, "train_wd": 0.34876929802957, "epoch": 301}
303
+ {"train_loss": 4.723629600948376, "train_lr": 0.00022052575354627007, "train_wd": 0.3497531181039364, "epoch": 302}
304
+ {"train_loss": 4.713962466965953, "train_lr": 0.00021627384419775031, "train_wd": 0.3507289343947893, "epoch": 303}
305
+ {"train_loss": 4.706370792205004, "train_lr": 0.0002120566000189049, "train_wd": 0.3516966867091784, "epoch": 304}
306
+ {"train_loss": 4.6989149204808935, "train_lr": 0.00020787429466066396, "train_wd": 0.35265631535158454, "epoch": 305}
307
+ {"train_loss": 4.689762066915739, "train_lr": 0.00020372719950683017, "train_wd": 0.35360776112759357, "epoch": 306}
308
+ {"train_loss": 4.681749886734118, "train_lr": 0.00019961558365646416, "train_wd": 0.354550965347545, "epoch": 307}
309
+ {"train_loss": 4.6752469475082545, "train_lr": 0.0001955397139064269, "train_wd": 0.35548586983016583, "epoch": 308}
310
+ {"train_loss": 4.66559200422417, "train_lr": 0.00019149985473406505, "train_wd": 0.35641241690613634, "epoch": 309}
311
+ {"train_loss": 4.65597446105606, "train_lr": 0.00018749626828005051, "train_wd": 0.3573305494216757, "epoch": 310}
312
+ {"train_loss": 4.646840298907172, "train_lr": 0.00018352921433137216, "train_wd": 0.3582402107420411, "epoch": 311}
313
+ {"train_loss": 4.63809587612903, "train_lr": 0.00017959895030447508, "train_wd": 0.35914134475503834, "epoch": 312}
314
+ {"train_loss": 4.628993505684973, "train_lr": 0.00017570573122855968, "train_wd": 0.360033895874476, "epoch": 313}
315
+ {"train_loss": 4.620042588237188, "train_lr": 0.00017184980972903216, "train_wd": 0.3609178090435984, "epoch": 314}
316
+ {"train_loss": 4.611121477900173, "train_lr": 0.0001680314360111131, "train_wd": 0.36179302973847705, "epoch": 315}
317
+ {"train_loss": 4.603098225131404, "train_lr": 0.00016425085784360193, "train_wd": 0.36265950397137564, "epoch": 316}
318
+ {"train_loss": 4.594411970185433, "train_lr": 0.00016050832054279753, "train_wd": 0.3635171782940824, "epoch": 317}
319
+ {"train_loss": 4.583315129200522, "train_lr": 0.00015680406695658212, "train_wd": 0.3643659998012077, "epoch": 318}
320
+ {"train_loss": 4.573659105719232, "train_lr": 0.00015313833744866188, "train_wd": 0.36520591613344044, "epoch": 319}
321
+ {"train_loss": 4.563590654842764, "train_lr": 0.00014951136988297273, "train_wd": 0.3660368754807849, "epoch": 320}
322
+ {"train_loss": 4.552846900707812, "train_lr": 0.00014592339960824152, "train_wd": 0.3668588265857537, "epoch": 321}
323
+ {"train_loss": 4.543069284656446, "train_lr": 0.00014237465944271735, "train_wd": 0.36767171874653265, "epoch": 322}
324
+ {"train_loss": 4.533651805895982, "train_lr": 0.00013886537965906472, "train_wd": 0.36847550182010247, "epoch": 323}
325
+ {"train_loss": 4.5218538625491895, "train_lr": 0.0001353957879694187, "train_wd": 0.3692701262253386, "epoch": 324}
326
+ {"train_loss": 4.512148304296722, "train_lr": 0.00013196610951061302, "train_wd": 0.3700555429460629, "epoch": 325}
327
+ {"train_loss": 4.501101960047639, "train_lr": 0.00012857656682956813, "train_wd": 0.3708317035340753, "epoch": 326}
328
+ {"train_loss": 4.490569316607108, "train_lr": 0.0001252273798688496, "train_wd": 0.3715985601121337, "epoch": 327}
329
+ {"train_loss": 4.480329731623713, "train_lr": 0.00012191876595240248, "train_wd": 0.3723560653769096, "epoch": 328}
330
+ {"train_loss": 4.469525034836442, "train_lr": 0.00011865093977143931, "train_wd": 0.37310417260191303, "epoch": 329}
331
+ {"train_loss": 4.458020923997191, "train_lr": 0.00011542411337051996, "train_wd": 0.3738428356403647, "epoch": 330}
332
+ {"train_loss": 4.447403555627254, "train_lr": 0.00011223849613378463, "train_wd": 0.3745720089280498, "epoch": 331}
333
+ {"train_loss": 4.436236642176013, "train_lr": 0.00010909429477137107, "train_wd": 0.37529164748612476, "epoch": 332}
334
+ {"train_loss": 4.425950154685955, "train_lr": 0.00010599171330599913, "train_wd": 0.3760017069238934, "epoch": 333}
335
+ {"train_loss": 4.412479007749154, "train_lr": 0.00010293095305973491, "train_wd": 0.37670214344154507, "epoch": 334}
336
+ {"train_loss": 4.4002665858283985, "train_lr": 9.991221264092395e-05, "train_wd": 0.3773929138328577, "epoch": 335}
337
+ {"train_loss": 4.3889885223407346, "train_lr": 9.693568793130585e-05, "train_wd": 0.37807397548785676, "epoch": 336}
338
+ {"train_loss": 4.378458981009887, "train_lr": 9.400157207330372e-05, "train_wd": 0.3787452863954541, "epoch": 337}
339
+ {"train_loss": 4.364677319888303, "train_lr": 9.111005545749096e-05, "train_wd": 0.37940680514602987, "epoch": 338}
340
+ {"train_loss": 4.352803270033986, "train_lr": 8.8261325710237e-05, "train_wd": 0.38005849093398913, "epoch": 339}
341
+ {"train_loss": 4.3400576879247295, "train_lr": 8.545556768153266e-05, "train_wd": 0.3807003035602873, "epoch": 340}
342
+ {"train_loss": 4.326367753991883, "train_lr": 8.269296343299616e-05, "train_wd": 0.38133220343489477, "epoch": 341}
343
+ {"train_loss": 4.314305759162354, "train_lr": 7.997369222605725e-05, "train_wd": 0.3819541515792518, "epoch": 342}
344
+ {"train_loss": 4.3017936556292575, "train_lr": 7.729793051032811e-05, "train_wd": 0.3825661096286652, "epoch": 343}
345
+ {"train_loss": 4.289358854591608, "train_lr": 7.466585191215186e-05, "train_wd": 0.38316803983468506, "epoch": 344}
346
+ {"train_loss": 4.2768534882772835, "train_lr": 7.20776272233374e-05, "train_wd": 0.38375990506741586, "epoch": 345}
347
+ {"train_loss": 4.262919721140754, "train_lr": 6.953342439007514e-05, "train_wd": 0.3843416688178255, "epoch": 346}
348
+ {"train_loss": 4.249351487921582, "train_lr": 6.703340850204112e-05, "train_wd": 0.38491329519998413, "epoch": 347}
349
+ {"train_loss": 4.23633065655363, "train_lr": 6.45777417816836e-05, "train_wd": 0.38547474895328326, "epoch": 348}
350
+ {"train_loss": 4.222715559051477, "train_lr": 6.216658357369685e-05, "train_wd": 0.38602599544461075, "epoch": 349}
351
+ {"train_loss": 4.2100277894216, "train_lr": 5.980009033468189e-05, "train_wd": 0.3865670006704875, "epoch": 350}
352
+ {"train_loss": 4.196193649745483, "train_lr": 5.747841562299365e-05, "train_wd": 0.38709773125916164, "epoch": 351}
353
+ {"train_loss": 4.182188350364839, "train_lr": 5.5201710088776864e-05, "train_wd": 0.38761815447267195, "epoch": 352}
354
+ {"train_loss": 4.169940389246106, "train_lr": 5.2970121464191254e-05, "train_wd": 0.38812823820886205, "epoch": 353}
355
+ {"train_loss": 4.1539944999700165, "train_lr": 5.078379455382448e-05, "train_wd": 0.3886279510033651, "epoch": 354}
356
+ {"train_loss": 4.141453638077259, "train_lr": 4.864287122529673e-05, "train_wd": 0.38911726203154107, "epoch": 355}
357
+ {"train_loss": 4.128194481420288, "train_lr": 4.654749040005499e-05, "train_wd": 0.389596141110381, "epoch": 356}
358
+ {"train_loss": 4.112860511937778, "train_lr": 4.449778804435772e-05, "train_wd": 0.3900645587003693, "epoch": 357}
359
+ {"train_loss": 4.098872231458016, "train_lr": 4.249389716045357e-05, "train_wd": 0.39052248590730043, "epoch": 358}
360
+ {"train_loss": 4.085434906297832, "train_lr": 4.053594777795074e-05, "train_wd": 0.3909698944840693, "epoch": 359}
361
+ {"train_loss": 4.0719569846332595, "train_lr": 3.862406694537818e-05, "train_wd": 0.3914067568324056, "epoch": 360}
362
+ {"train_loss": 4.056023749599545, "train_lr": 3.675837872194365e-05, "train_wd": 0.3918330460045821, "epoch": 361}
363
+ {"train_loss": 4.041581639676071, "train_lr": 3.4939004169482324e-05, "train_wd": 0.3922487357050755, "epoch": 362}
364
+ {"train_loss": 4.027914153324138, "train_lr": 3.316606134460145e-05, "train_wd": 0.3926538002921871, "epoch": 363}
365
+ {"train_loss": 4.014938752035157, "train_lr": 3.143966529102055e-05, "train_wd": 0.39304821477962415, "epoch": 364}
366
+ {"train_loss": 4.001450709873538, "train_lr": 2.975992803210509e-05, "train_wd": 0.3934319548380432, "epoch": 365}
367
+ {"train_loss": 3.988283786175253, "train_lr": 2.8126958563599086e-05, "train_wd": 0.3938049967965514, "epoch": 366}
368
+ {"train_loss": 3.972151799513091, "train_lr": 2.6540862846550967e-05, "train_wd": 0.3941673176441629, "epoch": 367}
369
+ {"train_loss": 3.95857991852301, "train_lr": 2.5001743800438792e-05, "train_wd": 0.39451889503122023, "epoch": 368}
370
+ {"train_loss": 3.946035816824789, "train_lr": 2.3509701296491925e-05, "train_wd": 0.394859707270774, "epoch": 369}
371
+ {"train_loss": 3.9312840673348886, "train_lr": 2.2064832151210218e-05, "train_wd": 0.39518973333992147, "epoch": 370}
372
+ {"train_loss": 3.918983992186191, "train_lr": 2.0667230120081943e-05, "train_wd": 0.39550895288109844, "epoch": 371}
373
+ {"train_loss": 3.9051354131776748, "train_lr": 1.931698589150017e-05, "train_wd": 0.39581734620334147, "epoch": 372}
374
+ {"train_loss": 3.8931077398079856, "train_lr": 1.801418708087777e-05, "train_wd": 0.39611489428349705, "epoch": 373}
375
+ {"train_loss": 3.880418803992508, "train_lr": 1.6758918224962656e-05, "train_wd": 0.3964015787673972, "epoch": 374}
376
+ {"train_loss": 3.868301875275864, "train_lr": 1.5551260776351905e-05, "train_wd": 0.396677381970993, "epoch": 375}
377
+ {"train_loss": 3.8559288923426878, "train_lr": 1.439129309820684e-05, "train_wd": 0.3969422868814452, "epoch": 376}
378
+ {"train_loss": 3.844095138908862, "train_lr": 1.3279090459167827e-05, "train_wd": 0.39719627715816996, "epoch": 377}
379
+ {"train_loss": 3.833755147614353, "train_lr": 1.221472502847016e-05, "train_wd": 0.3974393371338499, "epoch": 378}
380
+ {"train_loss": 3.8234637112235377, "train_lr": 1.119826587126139e-05, "train_wd": 0.39767145181540076, "epoch": 379}
381
+ {"train_loss": 3.8115567668117016, "train_lr": 1.0229778944119592e-05, "train_wd": 0.39789260688489875, "epoch": 380}
382
+ {"train_loss": 3.7997617969672075, "train_lr": 9.309327090773512e-06, "train_wd": 0.39810278870045396, "epoch": 381}
383
+ {"train_loss": 3.791720137274046, "train_lr": 8.436970038024909e-06, "train_wd": 0.39830198429706287, "epoch": 382}
384
+ {"train_loss": 3.78218844834325, "train_lr": 7.612764391872827e-06, "train_wd": 0.39849018138740255, "epoch": 383}
385
+ {"train_loss": 3.773911106131441, "train_lr": 6.836763633840455e-06, "train_wd": 0.3986673683625907, "epoch": 384}
386
+ {"train_loss": 3.765788542590648, "train_lr": 6.1090181175049534e-06, "train_wd": 0.3988335342929004, "epoch": 385}
387
+ {"train_loss": 3.7587412809677643, "train_lr": 5.429575065229989e-06, "train_wd": 0.39898866892843377, "epoch": 386}
Mambar/Base/log_eval.txt ADDED
@@ -0,0 +1,100 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"train_lr": 0.0019999999999998686, "train_loss": 1.4466070055580595, "epoch": 0, "test_loss": 0.9986482056434197, "test_acc1": 75.13, "test_acc5": 92.862}
2
+ {"train_lr": 0.0019995065603657376, "train_loss": 1.0434668161513756, "epoch": 1, "test_loss": 0.9376356114664346, "test_acc1": 76.294, "test_acc5": 93.542}
3
+ {"train_lr": 0.0019980267284282105, "train_loss": 0.9873289788990939, "epoch": 2, "test_loss": 0.923421277376392, "test_acc1": 76.454, "test_acc5": 93.796}
4
+ {"train_lr": 0.001995561964603092, "train_loss": 0.9675866722929635, "epoch": 3, "test_loss": 0.9122497581155099, "test_acc1": 76.79, "test_acc5": 93.896}
5
+ {"train_lr": 0.0019921147013145773, "train_loss": 0.9584416026384222, "epoch": 4, "test_loss": 0.9089569445994808, "test_acc1": 77.056, "test_acc5": 93.798}
6
+ {"train_lr": 0.0019876883405950175, "train_loss": 0.9552205390052418, "epoch": 5, "test_loss": 0.9099927767920677, "test_acc1": 76.846, "test_acc5": 93.898}
7
+ {"train_lr": 0.0019822872507288198, "train_loss": 0.9532406216281155, "epoch": 6, "test_loss": 0.9104332297544955, "test_acc1": 77.012, "test_acc5": 93.802}
8
+ {"train_lr": 0.0019759167619387524, "train_loss": 0.9521037693315156, "epoch": 7, "test_loss": 0.9109873524712174, "test_acc1": 76.86, "test_acc5": 94.0}
9
+ {"train_lr": 0.001968583161128624, "train_loss": 0.9507114925993665, "epoch": 8, "test_loss": 0.9066692712666738, "test_acc1": 76.86, "test_acc5": 94.024}
10
+ {"train_lr": 0.001960293685677003, "train_loss": 0.9524781338266264, "epoch": 9, "test_loss": 0.9104437387507894, "test_acc1": 76.81, "test_acc5": 93.824}
11
+ {"train_lr": 0.0019510565162951365, "train_loss": 0.9495290255771606, "epoch": 10, "test_loss": 0.9116887856093819, "test_acc1": 77.004, "test_acc5": 93.946}
12
+ {"train_lr": 0.0019408807689541316, "train_loss": 0.952276282613748, "epoch": 11, "test_loss": 0.9126302357143758, "test_acc1": 76.716, "test_acc5": 93.972}
13
+ {"train_lr": 0.0019297764858882515, "train_loss": 0.9494581628133905, "epoch": 12, "test_loss": 0.9054876058302876, "test_acc1": 77.018, "test_acc5": 93.984}
14
+ {"train_lr": 0.0019177546256839834, "train_loss": 0.9493990377056042, "epoch": 13, "test_loss": 0.9109190581628429, "test_acc1": 76.814, "test_acc5": 93.95}
15
+ {"train_lr": 0.0019048270524661083, "train_loss": 0.9476947398946326, "epoch": 14, "test_loss": 0.9133258156306908, "test_acc1": 76.842, "test_acc5": 93.996}
16
+ {"train_lr": 0.0018910065241883177, "train_loss": 0.9482654405149802, "epoch": 15, "test_loss": 0.9080370630678314, "test_acc1": 76.998, "test_acc5": 94.01}
17
+ {"train_lr": 0.0018763066800438779, "train_loss": 0.9494725002368068, "epoch": 16, "test_loss": 0.905944338235099, "test_acc1": 77.014, "test_acc5": 93.882}
18
+ {"train_lr": 0.0018607420270040137, "train_loss": 0.9458706569026291, "epoch": 17, "test_loss": 0.9057662823544744, "test_acc1": 77.118, "test_acc5": 93.948}
19
+ {"train_lr": 0.001844327925502041, "train_loss": 0.9448455252286152, "epoch": 18, "test_loss": 0.905175044141767, "test_acc1": 76.982, "test_acc5": 94.034}
20
+ {"train_lr": 0.0018270805742745338, "train_loss": 0.9443815069595338, "epoch": 19, "test_loss": 0.9029456756989974, "test_acc1": 77.21, "test_acc5": 93.954}
21
+ {"train_lr": 0.0018090169943749148, "train_loss": 0.9436027390143417, "epoch": 20, "test_loss": 0.9045922391478668, "test_acc1": 77.29, "test_acc5": 93.958}
22
+ {"train_lr": 0.001790155012375684, "train_loss": 0.944116922000909, "epoch": 21, "test_loss": 0.9041723653940898, "test_acc1": 77.016, "test_acc5": 94.034}
23
+ {"train_lr": 0.00177051324277586, "train_loss": 0.9422327687370744, "epoch": 22, "test_loss": 0.9058416822682256, "test_acc1": 77.022, "test_acc5": 94.022}
24
+ {"train_lr": 0.0017501110696303821, "train_loss": 0.9405130150374822, "epoch": 23, "test_loss": 0.9026701401757158, "test_acc1": 77.074, "test_acc5": 94.004}
25
+ {"train_lr": 0.001728968627421389, "train_loss": 0.9396099315712892, "epoch": 24, "test_loss": 0.9018396499288052, "test_acc1": 77.298, "test_acc5": 93.994}
26
+ {"train_lr": 0.0017071067811865767, "train_loss": 0.937873609896855, "epoch": 25, "test_loss": 0.9013323970234303, "test_acc1": 77.234, "test_acc5": 93.982}
27
+ {"train_lr": 0.0016845471059286062, "train_loss": 0.9375435502837288, "epoch": 26, "test_loss": 0.9028796444234946, "test_acc1": 77.12, "test_acc5": 93.996}
28
+ {"train_lr": 0.001661311865323677, "train_loss": 0.936128569405959, "epoch": 27, "test_loss": 0.9027889437230346, "test_acc1": 77.14, "test_acc5": 94.052}
29
+ {"train_lr": 0.001637423989748733, "train_loss": 0.9369419205143505, "epoch": 28, "test_loss": 0.900726139278668, "test_acc1": 77.184, "test_acc5": 94.058}
30
+ {"train_lr": 0.001612907053652909, "train_loss": 0.9353348353667065, "epoch": 29, "test_loss": 0.8985611302277926, "test_acc1": 77.218, "test_acc5": 94.104}
31
+ {"train_lr": 0.0015877852522924111, "train_loss": 0.9328561898557558, "epoch": 30, "test_loss": 0.8974022410257393, "test_acc1": 77.418, "test_acc5": 93.95}
32
+ {"train_lr": 0.0015620833778521046, "train_loss": 0.932249456453552, "epoch": 31, "test_loss": 0.8966858303531662, "test_acc1": 77.276, "test_acc5": 94.104}
33
+ {"train_lr": 0.0015358267949790963, "train_loss": 0.9293551495640315, "epoch": 32, "test_loss": 0.8946124476087672, "test_acc1": 77.34, "test_acc5": 94.096}
34
+ {"train_lr": 0.0015090414157503675, "train_loss": 0.9310670386355399, "epoch": 33, "test_loss": 0.8955803721228524, "test_acc1": 77.506, "test_acc5": 93.968}
35
+ {"train_lr": 0.0014817536741017646, "train_loss": 0.9288484953132525, "epoch": 34, "test_loss": 0.8939729660863767, "test_acc1": 77.402, "test_acc5": 94.098}
36
+ {"train_lr": 0.001453990499739611, "train_loss": 0.9263577398167245, "epoch": 35, "test_loss": 0.8957835574589117, "test_acc1": 77.352, "test_acc5": 94.064}
37
+ {"train_lr": 0.0014257792915651636, "train_loss": 0.9266760200143004, "epoch": 36, "test_loss": 0.8968203218315568, "test_acc1": 77.28, "test_acc5": 94.1}
38
+ {"train_lr": 0.001397147890634744, "train_loss": 0.9265140023081007, "epoch": 37, "test_loss": 0.8933908283862921, "test_acc1": 77.518, "test_acc5": 94.104}
39
+ {"train_lr": 0.001368124552684745, "train_loss": 0.9235190664690778, "epoch": 38, "test_loss": 0.8898873118793263, "test_acc1": 77.422, "test_acc5": 94.072}
40
+ {"train_lr": 0.0013387379202453142, "train_loss": 0.9236773780665777, "epoch": 39, "test_loss": 0.8901296779513359, "test_acc1": 77.588, "test_acc5": 94.07}
41
+ {"train_lr": 0.0013090169943749093, "train_loss": 0.9207237663504318, "epoch": 40, "test_loss": 0.8891934734933516, "test_acc1": 77.514, "test_acc5": 94.116}
42
+ {"train_lr": 0.0012789911060391633, "train_loss": 0.9182166175584149, "epoch": 41, "test_loss": 0.8858269520885195, "test_acc1": 77.708, "test_acc5": 94.104}
43
+ {"train_lr": 0.0012486898871647862, "train_loss": 0.9173645869052225, "epoch": 42, "test_loss": 0.8885101267825002, "test_acc1": 77.44, "test_acc5": 94.134}
44
+ {"train_lr": 0.001218143241396569, "train_loss": 0.916096912405989, "epoch": 43, "test_loss": 0.8902927198068565, "test_acc1": 77.474, "test_acc5": 94.098}
45
+ {"train_lr": 0.0011873813145856604, "train_loss": 0.9145932729589287, "epoch": 44, "test_loss": 0.8870058516254815, "test_acc1": 77.698, "test_acc5": 94.128}
46
+ {"train_lr": 0.0011564344650402871, "train_loss": 0.912664116458849, "epoch": 45, "test_loss": 0.8873345343505635, "test_acc1": 77.624, "test_acc5": 94.072}
47
+ {"train_lr": 0.0011253332335643327, "train_loss": 0.9122917507732339, "epoch": 46, "test_loss": 0.8856200893669177, "test_acc1": 77.632, "test_acc5": 94.172}
48
+ {"train_lr": 0.001094108313318475, "train_loss": 0.910397773539358, "epoch": 47, "test_loss": 0.8842362729865877, "test_acc1": 77.53, "test_acc5": 94.174}
49
+ {"train_lr": 0.0010627905195293463, "train_loss": 0.9093155278249402, "epoch": 48, "test_loss": 0.8836193873220698, "test_acc1": 77.704, "test_acc5": 94.138}
50
+ {"train_lr": 0.0010314107590780974, "train_loss": 0.9073813133063766, "epoch": 49, "test_loss": 0.8846154072324334, "test_acc1": 77.75, "test_acc5": 94.156}
51
+ {"train_lr": 0.0009999999999999343, "train_loss": 0.9058702561380717, "epoch": 50, "test_loss": 0.8801771187035324, "test_acc1": 77.75, "test_acc5": 94.274}
52
+ {"train_lr": 0.0009685892409218651, "train_loss": 0.9051738446663963, "epoch": 51, "test_loss": 0.8796514454857468, "test_acc1": 77.998, "test_acc5": 94.168}
53
+ {"train_lr": 0.0009372094804707101, "train_loss": 0.9039470223375811, "epoch": 52, "test_loss": 0.8798540564220579, "test_acc1": 77.894, "test_acc5": 94.196}
54
+ {"train_lr": 0.0009058916866814987, "train_loss": 0.9010344147950089, "epoch": 53, "test_loss": 0.8816311460779146, "test_acc1": 77.936, "test_acc5": 94.266}
55
+ {"train_lr": 0.0008746667664356905, "train_loss": 0.9003915467734486, "epoch": 54, "test_loss": 0.88195268280061, "test_acc1": 77.726, "test_acc5": 94.238}
56
+ {"train_lr": 0.0008435655349597399, "train_loss": 0.9006210838586295, "epoch": 55, "test_loss": 0.8789188394613583, "test_acc1": 77.84, "test_acc5": 94.238}
57
+ {"train_lr": 0.0008126186854142688, "train_loss": 0.8971389905868461, "epoch": 56, "test_loss": 0.8758326512011115, "test_acc1": 78.042, "test_acc5": 94.302}
58
+ {"train_lr": 0.0007818567586034925, "train_loss": 0.8955897440165698, "epoch": 57, "test_loss": 0.8751440471243066, "test_acc1": 78.15, "test_acc5": 94.226}
59
+ {"train_lr": 0.0007513101128351359, "train_loss": 0.8941782023422822, "epoch": 58, "test_loss": 0.8766227388168539, "test_acc1": 78.038, "test_acc5": 94.308}
60
+ {"train_lr": 0.000721008893960812, "train_loss": 0.8941977030865155, "epoch": 59, "test_loss": 0.8770973546730588, "test_acc1": 78.028, "test_acc5": 94.33}
61
+ {"train_lr": 0.0006909830056250302, "train_loss": 0.8913366875342974, "epoch": 60, "test_loss": 0.874009745810038, "test_acc1": 78.104, "test_acc5": 94.19}
62
+ {"train_lr": 0.0006612620797547435, "train_loss": 0.8904609653683505, "epoch": 61, "test_loss": 0.8725910240884327, "test_acc1": 78.134, "test_acc5": 94.348}
63
+ {"train_lr": 0.0006318754473153419, "train_loss": 0.8889056299234503, "epoch": 62, "test_loss": 0.8729563420995727, "test_acc1": 78.126, "test_acc5": 94.312}
64
+ {"train_lr": 0.0006028521093652263, "train_loss": 0.8871608624042057, "epoch": 63, "test_loss": 0.871739124359987, "test_acc1": 78.072, "test_acc5": 94.282}
65
+ {"train_lr": 0.000574220708434935, "train_loss": 0.887310620711367, "epoch": 64, "test_loss": 0.8711684146881713, "test_acc1": 78.242, "test_acc5": 94.268}
66
+ {"train_lr": 0.0005460095002604524, "train_loss": 0.8851562755623675, "epoch": 65, "test_loss": 0.873956374233336, "test_acc1": 78.19, "test_acc5": 94.328}
67
+ {"train_lr": 0.0005182463258982946, "train_loss": 0.8832700116350752, "epoch": 66, "test_loss": 0.8714524007895413, "test_acc1": 78.15, "test_acc5": 94.278}
68
+ {"train_lr": 0.0004909585842496341, "train_loss": 0.88251301617359, "epoch": 67, "test_loss": 0.8716828994205236, "test_acc1": 78.168, "test_acc5": 94.308}
69
+ {"train_lr": 0.0004641732050210111, "train_loss": 0.8825136449900904, "epoch": 68, "test_loss": 0.8695587829479476, "test_acc1": 78.232, "test_acc5": 94.308}
70
+ {"train_lr": 0.0004379166221478616, "train_loss": 0.8793549460057158, "epoch": 69, "test_loss": 0.8703527761161175, "test_acc1": 78.246, "test_acc5": 94.27}
71
+ {"train_lr": 0.00041221474770750024, "train_loss": 0.8775566902117304, "epoch": 70, "test_loss": 0.8676054321820169, "test_acc1": 78.172, "test_acc5": 94.35}
72
+ {"train_lr": 0.0003870929463470055, "train_loss": 0.877269076118696, "epoch": 71, "test_loss": 0.8675923489243783, "test_acc1": 78.392, "test_acc5": 94.308}
73
+ {"train_lr": 0.0003625760102513295, "train_loss": 0.8769359756834118, "epoch": 72, "test_loss": 0.867548253168078, "test_acc1": 78.306, "test_acc5": 94.354}
74
+ {"train_lr": 0.0003386881346763327, "train_loss": 0.8751998166447632, "epoch": 73, "test_loss": 0.8682303870730388, "test_acc1": 78.286, "test_acc5": 94.304}
75
+ {"train_lr": 0.0003154528940713109, "train_loss": 0.8748905586270014, "epoch": 74, "test_loss": 0.8682153877775992, "test_acc1": 78.294, "test_acc5": 94.346}
76
+ {"train_lr": 0.00029289321881343744, "train_loss": 0.873052065750741, "epoch": 75, "test_loss": 0.8663290569087123, "test_acc1": 78.376, "test_acc5": 94.37}
77
+ {"train_lr": 0.0002710313725785874, "train_loss": 0.8718183263779116, "epoch": 76, "test_loss": 0.8659734769779093, "test_acc1": 78.44, "test_acc5": 94.374}
78
+ {"train_lr": 0.0002498889303695469, "train_loss": 0.8718300200716, "epoch": 77, "test_loss": 0.8652986242719318, "test_acc1": 78.408, "test_acc5": 94.364}
79
+ {"train_lr": 0.0002294867572242191, "train_loss": 0.8703978585627762, "epoch": 78, "test_loss": 0.8650836781848728, "test_acc1": 78.522, "test_acc5": 94.384}
80
+ {"train_lr": 0.0002098449876243195, "train_loss": 0.8691956093560873, "epoch": 79, "test_loss": 0.8659568168699284, "test_acc1": 78.362, "test_acc5": 94.352}
81
+ {"train_lr": 0.00019098300562504553, "train_loss": 0.8691677808184125, "epoch": 80, "test_loss": 0.8653898394626119, "test_acc1": 78.402, "test_acc5": 94.364}
82
+ {"train_lr": 0.00017291942572544524, "train_loss": 0.8679120109032927, "epoch": 81, "test_loss": 0.8641006554407842, "test_acc1": 78.518, "test_acc5": 94.338}
83
+ {"train_lr": 0.0001556720744979767, "train_loss": 0.8682523868022516, "epoch": 82, "test_loss": 0.8647359752136728, "test_acc1": 78.464, "test_acc5": 94.382}
84
+ {"train_lr": 0.00013925797299606019, "train_loss": 0.8648756306307391, "epoch": 83, "test_loss": 0.8636470552143234, "test_acc1": 78.482, "test_acc5": 94.388}
85
+ {"train_lr": 0.00012369331995613583, "train_loss": 0.8643114578233354, "epoch": 84, "test_loss": 0.8636927481959847, "test_acc1": 78.484, "test_acc5": 94.394}
86
+ {"train_lr": 0.00010899347581163435, "train_loss": 0.8645053450263742, "epoch": 85, "test_loss": 0.8635647471451089, "test_acc1": 78.478, "test_acc5": 94.374}
87
+ {"train_lr": 9.5172947533978e-05, "train_loss": 0.8618958545353858, "epoch": 86, "test_loss": 0.8634990527273139, "test_acc1": 78.486, "test_acc5": 94.374}
88
+ {"train_lr": 8.224537431602316e-05, "train_loss": 0.8638592543622945, "epoch": 87, "test_loss": 0.8623975143789331, "test_acc1": 78.512, "test_acc5": 94.358}
89
+ {"train_lr": 7.022351411175157e-05, "train_loss": 0.8631021135117929, "epoch": 88, "test_loss": 0.8629720954181593, "test_acc1": 78.548, "test_acc5": 94.368}
90
+ {"train_lr": 5.911923104577377e-05, "train_loss": 0.8618255903690613, "epoch": 89, "test_loss": 0.8628521017406298, "test_acc1": 78.52, "test_acc5": 94.39}
91
+ {"train_lr": 4.8943483704848814e-05, "train_loss": 0.8617792921308227, "epoch": 90, "test_loss": 0.8626455465698486, "test_acc1": 78.536, "test_acc5": 94.384}
92
+ {"train_lr": 3.9706314323055196e-05, "train_loss": 0.8601736509223676, "epoch": 91, "test_loss": 0.862741590079749, "test_acc1": 78.518, "test_acc5": 94.392}
93
+ {"train_lr": 3.141683887136792e-05, "train_loss": 0.8606807779173969, "epoch": 92, "test_loss": 0.8627357340758414, "test_acc1": 78.496, "test_acc5": 94.406}
94
+ {"train_lr": 2.4083238061252423e-05, "train_loss": 0.860788486891992, "epoch": 93, "test_loss": 0.8624967259671682, "test_acc1": 78.52, "test_acc5": 94.392}
95
+ {"train_lr": 1.7712749271312274e-05, "train_loss": 0.8586979743615656, "epoch": 94, "test_loss": 0.8624637805668595, "test_acc1": 78.516, "test_acc5": 94.402}
96
+ {"train_lr": 1.2311659404861753e-05, "train_loss": 0.8585625850542326, "epoch": 95, "test_loss": 0.8623979722371187, "test_acc1": 78.51, "test_acc5": 94.39}
97
+ {"train_lr": 7.885298685522277e-06, "train_loss": 0.8593257459768333, "epoch": 96, "test_loss": 0.8624408127706679, "test_acc1": 78.514, "test_acc5": 94.392}
98
+ {"train_lr": 4.4380353969200165e-06, "train_loss": 0.8585100486082788, "epoch": 97, "test_loss": 0.8624630375667606, "test_acc1": 78.512, "test_acc5": 94.404}
99
+ {"train_lr": 1.9732715717283947e-06, "train_loss": 0.8577373142283867, "epoch": 98, "test_loss": 0.8624525259599052, "test_acc1": 78.506, "test_acc5": 94.404}
100
+ {"train_lr": 4.934396342684219e-07, "train_loss": 0.8601024688016496, "epoch": 99, "test_loss": 0.862451644847765, "test_acc1": 78.51, "test_acc5": 94.406}
Vim/Base/checkpoint.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e80c016e2332a465cb7b00b7c5a66fb65717cd16a014f209bda24fa407c6cc5
3
+ size 1794135568
Vim/Base/checkpoint.pth.tar ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c2fa0df22fe13feff9358f38d2e092566ceaeb624f3c6dce20b25296b85ae2c
3
+ size 49162696
Vim/Base/config.txt ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ arch: vim_base_patch16_224
2
+ batch_size_per_gpu: 32
3
+ clip_grad: 3.0
4
+ drop_path_rate: 0.1
5
+ epochs: 400
6
+ freeze_last_layer: 3
7
+ global_crops_scale: (0.25, 1.0)
8
+ gpu: 0
9
+ local_crops_number: 10
10
+ local_crops_scale: (0.05, 0.25)
11
+ local_rank: 0
12
+ lr: 0.00075
13
+ min_lr: 1e-06
14
+ momentum_teacher: 0.996
15
+ ngpus: 8
16
+ nodes: 3
17
+ norm_last_layer: True
18
+ num_workers: 10
19
+ optimizer: adamw
20
+ out_dim: 65536
21
+ partition: main
22
+ patch_size: 16
23
+ rank: 0
24
+ saveckp_freq: 5
25
+ seed: 0
26
+ teacher_temp: 0.07
27
+ use_bn_in_head: False
28
+ use_fp16: True (bf16)
29
+ use_volta32: False
30
+ warmup_epochs: 10
31
+ warmup_teacher_temp: 0.04
32
+ warmup_teacher_temp_epochs: 50
33
+ weight_decay: 0.04
34
+ weight_decay_end: 0.4
35
+ world_size: 24
Vim/Base/log.txt ADDED
@@ -0,0 +1,400 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"train_loss": 8.791311841550396, "train_lr": 0.00011243929492175784, "train_wd": 0.0400018488812943, "epoch": 0}
2
+ {"train_loss": 5.462759949147797, "train_lr": 0.00033745278493914506, "train_wd": 0.040012948686810525, "epoch": 1}
3
+ {"train_loss": 4.988951792498287, "train_lr": 0.0005624662749565324, "train_wd": 0.04003515094146663, "epoch": 2}
4
+ {"train_loss": 8.64678563664464, "train_lr": 0.0007874797649739196, "train_wd": 0.04006845427572264, "epoch": 3}
5
+ {"train_loss": 7.653681282886117, "train_lr": 0.0010124932549913067, "train_wd": 0.040112856635272226, "epoch": 4}
6
+ {"train_loss": 6.094493289574159, "train_lr": 0.0012375067450086943, "train_wd": 0.04016835528116863, "epoch": 5}
7
+ {"train_loss": 5.40798800098572, "train_lr": 0.0014625202350260808, "train_wd": 0.04023494678999399, "epoch": 6}
8
+ {"train_loss": 5.0472661788455495, "train_lr": 0.0016875337250434681, "train_wd": 0.040312627054070405, "epoch": 7}
9
+ {"train_loss": 4.793536900872473, "train_lr": 0.0019125472150608547, "train_wd": 0.040401391281713196, "epoch": 8}
10
+ {"train_loss": 4.606703310799923, "train_lr": 0.002137560705078243, "train_wd": 0.04050123399752657, "epoch": 9}
11
+ {"train_loss": 4.454039123507855, "train_lr": 0.0022499878497089162, "train_wd": 0.04061214904274183, "epoch": 10}
12
+ {"train_loss": 4.324510647458948, "train_lr": 0.0022499149051764637, "train_wd": 0.04073412957559615, "epoch": 11}
13
+ {"train_loss": 4.2179946069725505, "train_lr": 0.0022497689989721655, "train_wd": 0.04086716807175613, "epoch": 12}
14
+ {"train_loss": 4.13319051213902, "train_lr": 0.0022495501405636583, "train_wd": 0.04101125632478038, "epoch": 13}
15
+ {"train_loss": 4.063291063953599, "train_lr": 0.0022492583441523595, "train_wd": 0.04116638544662668, "epoch": 14}
16
+ {"train_loss": 4.00746581589075, "train_lr": 0.0022488936286725212, "train_wd": 0.041332545868200114, "epoch": 15}
17
+ {"train_loss": 3.9581959288564326, "train_lr": 0.0022484560177899954, "train_wd": 0.04150972733994341, "epoch": 16}
18
+ {"train_loss": 3.9184228530366547, "train_lr": 0.0022479455399007442, "train_wd": 0.04169791893246864, "epoch": 17}
19
+ {"train_loss": 3.8849882615818014, "train_lr": 0.002247362228128924, "train_wd": 0.04189710903723169, "epoch": 18}
20
+ {"train_loss": 3.860449588377413, "train_lr": 0.0022467061203248154, "train_wd": 0.042107285367249066, "epoch": 19}
21
+ {"train_loss": 3.8383745298349408, "train_lr": 0.0022459772590623147, "train_wd": 0.04232843495785438, "epoch": 20}
22
+ {"train_loss": 3.824272158888461, "train_lr": 0.0022451756916361826, "train_wd": 0.042560544167499416, "epoch": 21}
23
+ {"train_loss": 3.8089843666036542, "train_lr": 0.002244301470058971, "train_wd": 0.04280359867859451, "epoch": 22}
24
+ {"train_loss": 3.79720155734548, "train_lr": 0.0022433546510576734, "train_wd": 0.043057583498392824, "epoch": 23}
25
+ {"train_loss": 3.7873032834532734, "train_lr": 0.0022423352960700134, "train_wd": 0.043322482959913984, "epoch": 24}
26
+ {"train_loss": 3.783618225140585, "train_lr": 0.002241243471240486, "train_wd": 0.0435982807229118, "epoch": 25}
27
+ {"train_loss": 3.780716408047078, "train_lr": 0.0022400792474160285, "train_wd": 0.0438849597748808, "epoch": 26}
28
+ {"train_loss": 3.779477525273149, "train_lr": 0.0022388427001414643, "train_wd": 0.04418250243210681, "epoch": 27}
29
+ {"train_loss": 3.7802207430275225, "train_lr": 0.0022375339096545595, "train_wd": 0.044490890340757094, "epoch": 28}
30
+ {"train_loss": 3.7850068895210276, "train_lr": 0.002236152960880873, "train_wd": 0.04481010447801298, "epoch": 29}
31
+ {"train_loss": 3.78894633528807, "train_lr": 0.0022346999434281834, "train_wd": 0.04514012515324267, "epoch": 30}
32
+ {"train_loss": 3.7957354486703303, "train_lr": 0.002233174951580708, "train_wd": 0.045480932009216435, "epoch": 31}
33
+ {"train_loss": 3.8062724955945755, "train_lr": 0.0022315780842929855, "train_wd": 0.04583250402336228, "epoch": 32}
34
+ {"train_loss": 3.8167687443365677, "train_lr": 0.002229909445183446, "train_wd": 0.04619481950906189, "epoch": 33}
35
+ {"train_loss": 3.828850667801597, "train_lr": 0.0022281691425276857, "train_wd": 0.04656785611698974, "epoch": 34}
36
+ {"train_loss": 3.8442154121782472, "train_lr": 0.0022263572892514535, "train_wd": 0.04695159083649067, "epoch": 35}
37
+ {"train_loss": 3.8620184283438537, "train_lr": 0.0022244740029233163, "train_wd": 0.04734599999699968, "epoch": 36}
38
+ {"train_loss": 3.881701397929165, "train_lr": 0.0022225194057470137, "train_wd": 0.04775105926950166, "epoch": 37}
39
+ {"train_loss": 3.9013140438188563, "train_lr": 0.0022204936245535647, "train_wd": 0.04816674366803294, "epoch": 38}
40
+ {"train_loss": 3.922961272906771, "train_lr": 0.0022183967907930054, "train_wd": 0.048593027551221725, "epoch": 39}
41
+ {"train_loss": 3.9491374919728504, "train_lr": 0.0022162290405258753, "train_wd": 0.049029884623870014, "epoch": 40}
42
+ {"train_loss": 3.991124549244853, "train_lr": 0.002213990514414376, "train_wd": 0.04947728793857585, "epoch": 41}
43
+ {"train_loss": 4.016615633728454, "train_lr": 0.0022116813577132653, "train_wd": 0.0499352098973953, "epoch": 42}
44
+ {"train_loss": 4.068125319727462, "train_lr": 0.002209301720260418, "train_wd": 0.05040362225354507, "epoch": 43}
45
+ {"train_loss": 4.1491790337504435, "train_lr": 0.0022068517564670874, "train_wd": 0.0508824961131445, "epoch": 44}
46
+ {"train_loss": 4.247970356667738, "train_lr": 0.002204331625307916, "train_wd": 0.05137180193699805, "epoch": 45}
47
+ {"train_loss": 4.3383591155663765, "train_lr": 0.0022017414903106086, "train_wd": 0.05187150954241808, "epoch": 46}
48
+ {"train_loss": 4.426528246151648, "train_lr": 0.0021990815195453064, "train_wd": 0.05238158810508532, "epoch": 47}
49
+ {"train_loss": 4.504598460454258, "train_lr": 0.0021963518856136996, "train_wd": 0.05290200616095152, "epoch": 48}
50
+ {"train_loss": 4.5765051458307875, "train_lr": 0.0021935527656378254, "train_wd": 0.0534327316081796, "epoch": 49}
51
+ {"train_loss": 4.597023761553539, "train_lr": 0.002190684341248574, "train_wd": 0.05397373170912373, "epoch": 50}
52
+ {"train_loss": 4.611929891361512, "train_lr": 0.002187746798573889, "train_wd": 0.05452497309234971, "epoch": 51}
53
+ {"train_loss": 4.6223640464109295, "train_lr": 0.0021847403282266916, "train_wd": 0.05508642175469238, "epoch": 52}
54
+ {"train_loss": 4.619651290694539, "train_lr": 0.002181665125292556, "train_wd": 0.05565804306335362, "epoch": 53}
55
+ {"train_loss": 4.617645353299203, "train_lr": 0.002178521389316987, "train_wd": 0.05623980175803826, "epoch": 54}
56
+ {"train_loss": 4.635732807635928, "train_lr": 0.002175309324292497, "train_wd": 0.05683166195313003, "epoch": 55}
57
+ {"train_loss": 4.679225808865637, "train_lr": 0.0021720291386453914, "train_wd": 0.057433587139903916, "epoch": 56}
58
+ {"train_loss": 4.735275753360572, "train_lr": 0.0021686810452222105, "train_wd": 0.05804554018877921, "epoch": 57}
59
+ {"train_loss": 4.7726854803345855, "train_lr": 0.002165265261275944, "train_wd": 0.058667483351609144, "epoch": 58}
60
+ {"train_loss": 4.785418109469515, "train_lr": 0.002161782008451921, "train_wd": 0.059299378264010244, "epoch": 59}
61
+ {"train_loss": 4.796479801289278, "train_lr": 0.002158231512773408, "train_wd": 0.059941185947727224, "epoch": 60}
62
+ {"train_loss": 4.8058015219718335, "train_lr": 0.0021546140046269984, "train_wd": 0.06059286681303961, "epoch": 61}
63
+ {"train_loss": 4.814654995527246, "train_lr": 0.0021509297187476102, "train_wd": 0.06125438066120149, "epoch": 62}
64
+ {"train_loss": 4.82154249141423, "train_lr": 0.002147178894203261, "train_wd": 0.06192568668692288, "epoch": 63}
65
+ {"train_loss": 4.819661550378676, "train_lr": 0.002143361774379599, "train_wd": 0.06260674348088577, "epoch": 64}
66
+ {"train_loss": 4.823709943537994, "train_lr": 0.0021394786069640456, "train_wd": 0.06329750903229917, "epoch": 65}
67
+ {"train_loss": 4.825584393682526, "train_lr": 0.0021355296439297764, "train_wd": 0.06399794073149012, "epoch": 66}
68
+ {"train_loss": 4.8274447081579295, "train_lr": 0.0021315151415193436, "train_wd": 0.06470799537253205, "epoch": 67}
69
+ {"train_loss": 4.829449153459853, "train_lr": 0.0021274353602280514, "train_wd": 0.0654276291559101, "epoch": 68}
70
+ {"train_loss": 4.830739360109127, "train_lr": 0.0021232905647870603, "train_wd": 0.06615679769122293, "epoch": 69}
71
+ {"train_loss": 4.830983481908159, "train_lr": 0.002119081024146212, "train_wd": 0.06689545599991996, "epoch": 70}
72
+ {"train_loss": 4.833181741146399, "train_lr": 0.0021148070114565664, "train_wd": 0.06764355851807788, "epoch": 71}
73
+ {"train_loss": 4.832191391707324, "train_lr": 0.002110468804052679, "train_wd": 0.06840105909920928, "epoch": 72}
74
+ {"train_loss": 4.833065345186553, "train_lr": 0.002106066683434609, "train_wd": 0.06916791101711027, "epoch": 73}
75
+ {"train_loss": 4.837334010139596, "train_lr": 0.002101600935249654, "train_wd": 0.06994406696874236, "epoch": 74}
76
+ {"train_loss": 4.835683083964242, "train_lr": 0.0020970718492738225, "train_wd": 0.07072947907715031, "epoch": 75}
77
+ {"train_loss": 4.838766262691608, "train_lr": 0.0020924797193930117, "train_wd": 0.07152409889441551, "epoch": 76}
78
+ {"train_loss": 4.844726546616148, "train_lr": 0.002087824843583941, "train_wd": 0.07232787740464512, "epoch": 77}
79
+ {"train_loss": 4.846732470724318, "train_lr": 0.0020831075238948375, "train_wd": 0.07314076502699401, "epoch": 78}
80
+ {"train_loss": 4.849938967793013, "train_lr": 0.00207832806642581, "train_wd": 0.07396271161872502, "epoch": 79}
81
+ {"train_loss": 4.8508237060025445, "train_lr": 0.002073486781309009, "train_wd": 0.0747936664783003, "epoch": 80}
82
+ {"train_loss": 4.85264684552912, "train_lr": 0.0020685839826884915, "train_wd": 0.07563357834851012, "epoch": 81}
83
+ {"train_loss": 4.8577792402937545, "train_lr": 0.00206361998869982, "train_wd": 0.07648239541963398, "epoch": 82}
84
+ {"train_loss": 4.862185284179701, "train_lr": 0.002058595121449471, "train_wd": 0.07734006533263661, "epoch": 83}
85
+ {"train_loss": 4.864996193660249, "train_lr": 0.0020535097069938665, "train_wd": 0.07820653518239781, "epoch": 84}
86
+ {"train_loss": 4.868034026248278, "train_lr": 0.002048364075318258, "train_wd": 0.07908175152097584, "epoch": 85}
87
+ {"train_loss": 4.874134428948045, "train_lr": 0.0020431585603153187, "train_wd": 0.07996566036090431, "epoch": 86}
88
+ {"train_loss": 4.878877576455462, "train_lr": 0.0020378934997634644, "train_wd": 0.0808582071785224, "epoch": 87}
89
+ {"train_loss": 4.880632186351682, "train_lr": 0.002032569235304918, "train_wd": 0.08175933691733812, "epoch": 88}
90
+ {"train_loss": 4.886346240177286, "train_lr": 0.0020271861124235707, "train_wd": 0.08266899399142386, "epoch": 89}
91
+ {"train_loss": 4.889256202345558, "train_lr": 0.002021744480422558, "train_wd": 0.08358712228884768, "epoch": 90}
92
+ {"train_loss": 4.891181801392925, "train_lr": 0.0020162446924015765, "train_wd": 0.0845136651751305, "epoch": 91}
93
+ {"train_loss": 4.897939390487236, "train_lr": 0.0020106871052339914, "train_wd": 0.08544856549674296, "epoch": 92}
94
+ {"train_loss": 4.899022969011542, "train_lr": 0.0020050720795436734, "train_wd": 0.08639176558462944, "epoch": 93}
95
+ {"train_loss": 4.902116217612505, "train_lr": 0.001999399979681586, "train_wd": 0.08734320725776569, "epoch": 94}
96
+ {"train_loss": 4.905756883960453, "train_lr": 0.001993671173702164, "train_wd": 0.0883028318267475, "epoch": 95}
97
+ {"train_loss": 4.907479024387235, "train_lr": 0.0019878860333394205, "train_wd": 0.08927058009741136, "epoch": 96}
98
+ {"train_loss": 4.910941307058485, "train_lr": 0.001982044933982823, "train_wd": 0.09024639237448524, "epoch": 97}
99
+ {"train_loss": 4.912565750898503, "train_lr": 0.001976148254652931, "train_wd": 0.09123020846527136, "epoch": 98}
100
+ {"train_loss": 4.915782493456519, "train_lr": 0.0019701963779768248, "train_wd": 0.09222196768335969, "epoch": 99}
101
+ {"train_loss": 4.9192635208713735, "train_lr": 0.0019641896901632493, "train_wd": 0.09322160885236916, "epoch": 100}
102
+ {"train_loss": 4.92194232094488, "train_lr": 0.001958128580977568, "train_wd": 0.09422907030972458, "epoch": 101}
103
+ {"train_loss": 4.927125146718239, "train_lr": 0.001952013443716468, "train_wd": 0.09524428991045686, "epoch": 102}
104
+ {"train_loss": 4.929888047581668, "train_lr": 0.0019458446751824453, "train_wd": 0.0962672050310395, "epoch": 103}
105
+ {"train_loss": 4.932969900540454, "train_lr": 0.0019396226756580488, "train_wd": 0.09729775257324913, "epoch": 104}
106
+ {"train_loss": 4.935349319210585, "train_lr": 0.0019333478488799186, "train_wd": 0.0983358689680596, "epoch": 105}
107
+ {"train_loss": 4.938486134810604, "train_lr": 0.001927020602012559, "train_wd": 0.09938149017956104, "epoch": 106}
108
+ {"train_loss": 4.944360662451227, "train_lr": 0.001920641345621957, "train_wd": 0.10043455170891225, "epoch": 107}
109
+ {"train_loss": 4.946000228748381, "train_lr": 0.0019142104936489264, "train_wd": 0.10149498859831774, "epoch": 108}
110
+ {"train_loss": 4.94768348486899, "train_lr": 0.0019077284633822254, "train_wd": 0.10256273543503483, "epoch": 109}
111
+ {"train_loss": 4.952008490302532, "train_lr": 0.0019011956754315165, "train_wd": 0.1036377263554089, "epoch": 110}
112
+ {"train_loss": 4.956965806994507, "train_lr": 0.0018946125537000359, "train_wd": 0.10471989504893713, "epoch": 111}
113
+ {"train_loss": 4.95753159006532, "train_lr": 0.0018879795253571349, "train_wd": 0.10580917476235611, "epoch": 112}
114
+ {"train_loss": 4.961063407915388, "train_lr": 0.001881297020810505, "train_wd": 0.10690549830376252, "epoch": 113}
115
+ {"train_loss": 4.96400594280111, "train_lr": 0.001874565473678295, "train_wd": 0.10800879804675649, "epoch": 114}
116
+ {"train_loss": 4.964787129947036, "train_lr": 0.00186778532076095, "train_wd": 0.10911900593461249, "epoch": 115}
117
+ {"train_loss": 4.964636370682602, "train_lr": 0.0018609570020128815, "train_wd": 0.1102360534844788, "epoch": 116}
118
+ {"train_loss": 4.969423674297133, "train_lr": 0.0018540809605138995, "train_wd": 0.11135987179160022, "epoch": 117}
119
+ {"train_loss": 4.971901504345221, "train_lr": 0.0018471576424404846, "train_wd": 0.11249039153357049, "epoch": 118}
120
+ {"train_loss": 4.975119516986022, "train_lr": 0.0018401874970368302, "train_wd": 0.11362754297460619, "epoch": 119}
121
+ {"train_loss": 4.977751396703634, "train_lr": 0.001833170976585681, "train_wd": 0.11477125596985009, "epoch": 120}
122
+ {"train_loss": 4.978540643269448, "train_lr": 0.001826108536378989, "train_wd": 0.11592145996969742, "epoch": 121}
123
+ {"train_loss": 4.989607562549966, "train_lr": 0.001819000634688385, "train_wd": 0.11707808402414822, "epoch": 122}
124
+ {"train_loss": 4.981191045624747, "train_lr": 0.0018118477327354254, "train_wd": 0.11824105678718107, "epoch": 123}
125
+ {"train_loss": 4.985796501078337, "train_lr": 0.001804650294661658, "train_wd": 0.11941030652115958, "epoch": 124}
126
+ {"train_loss": 4.9872467668531995, "train_lr": 0.0017974087874985285, "train_wd": 0.12058576110125113, "epoch": 125}
127
+ {"train_loss": 4.99069191080084, "train_lr": 0.0017901236811370637, "train_wd": 0.12176734801988053, "epoch": 126}
128
+ {"train_loss": 4.993084243554577, "train_lr": 0.0017827954482973738, "train_wd": 0.12295499439120157, "epoch": 127}
129
+ {"train_loss": 5.000670218704749, "train_lr": 0.0017754245644979866, "train_wd": 0.12414862695559117, "epoch": 128}
130
+ {"train_loss": 4.995278656750703, "train_lr": 0.0017680115080249844, "train_wd": 0.12534817208417057, "epoch": 129}
131
+ {"train_loss": 4.999131863756622, "train_lr": 0.0017605567599009858, "train_wd": 0.12655355578334548, "epoch": 130}
132
+ {"train_loss": 5.0022163943504445, "train_lr": 0.0017530608038539043, "train_wd": 0.12776470369937215, "epoch": 131}
133
+ {"train_loss": 5.002891992154024, "train_lr": 0.0017455241262855897, "train_wd": 0.12898154112294136, "epoch": 132}
134
+ {"train_loss": 5.005699484063377, "train_lr": 0.0017379472162402502, "train_wd": 0.13020399299378943, "epoch": 133}
135
+ {"train_loss": 5.009675585638752, "train_lr": 0.0017303305653727217, "train_wd": 0.13143198390532637, "epoch": 134}
136
+ {"train_loss": 5.010137212683829, "train_lr": 0.0017226746679165615, "train_wd": 0.13266543810928916, "epoch": 135}
137
+ {"train_loss": 5.0134468773941245, "train_lr": 0.0017149800206519871, "train_wd": 0.13390427952041153, "epoch": 136}
138
+ {"train_loss": 5.0174342189118155, "train_lr": 0.0017072471228736295, "train_wd": 0.13514843172112007, "epoch": 137}
139
+ {"train_loss": 5.018784061628137, "train_lr": 0.0016994764763581395, "train_wd": 0.13639781796624673, "epoch": 138}
140
+ {"train_loss": 5.020582273953872, "train_lr": 0.0016916685853316453, "train_wd": 0.13765236118776253, "epoch": 139}
141
+ {"train_loss": 5.0213374859935564, "train_lr": 0.001683823956436995, "train_wd": 0.13891198399953267, "epoch": 140}
142
+ {"train_loss": 5.022324731190809, "train_lr": 0.0016759430987009225, "train_wd": 0.1401766087020883, "epoch": 141}
143
+ {"train_loss": 5.02517630914442, "train_lr": 0.0016680265235009945, "train_wd": 0.14144615728742047, "epoch": 142}
144
+ {"train_loss": 5.026830006661794, "train_lr": 0.0016600747445324265, "train_wd": 0.14272055144379325, "epoch": 143}
145
+ {"train_loss": 5.027395590365552, "train_lr": 0.0016520882777747573, "train_wd": 0.14399971256057137, "epoch": 144}
146
+ {"train_loss": 5.032108405302707, "train_lr": 0.0016440676414583798, "train_wd": 0.1452835617330724, "epoch": 145}
147
+ {"train_loss": 5.034408041702615, "train_lr": 0.0016360133560308762, "train_wd": 0.14657201976743112, "epoch": 146}
148
+ {"train_loss": 5.035408462289807, "train_lr": 0.001627925944123296, "train_wd": 0.14786500718548767, "epoch": 147}
149
+ {"train_loss": 5.037028235133937, "train_lr": 0.001619805930516211, "train_wd": 0.14916244422968705, "epoch": 148}
150
+ {"train_loss": 5.035588470449169, "train_lr": 0.0016116538421056612, "train_wd": 0.15046425086800097, "epoch": 149}
151
+ {"train_loss": 5.038466708539582, "train_lr": 0.0016034702078689797, "train_wd": 0.15177034679886398, "epoch": 150}
152
+ {"train_loss": 5.0407271008435295, "train_lr": 0.0015952555588304694, "train_wd": 0.15308065145612665, "epoch": 151}
153
+ {"train_loss": 5.04209598876256, "train_lr": 0.0015870104280269347, "train_wd": 0.15439508401402596, "epoch": 152}
154
+ {"train_loss": 5.043704204267259, "train_lr": 0.0015787353504730915, "train_wd": 0.15571356339217005, "epoch": 153}
155
+ {"train_loss": 5.041929824984998, "train_lr": 0.0015704308631268697, "train_wd": 0.15703600826054048, "epoch": 154}
156
+ {"train_loss": 5.045829544029981, "train_lr": 0.0015620975048545515, "train_wd": 0.15836233704450803, "epoch": 155}
157
+ {"train_loss": 5.048496541823987, "train_lr": 0.00155373581639581, "train_wd": 0.1596924679298659, "epoch": 156}
158
+ {"train_loss": 5.048377593936061, "train_lr": 0.0015453463403286303, "train_wd": 0.16102631886787566, "epoch": 157}
159
+ {"train_loss": 5.0482297805692555, "train_lr": 0.001536929621034091, "train_wd": 0.162363807580329, "epoch": 158}
160
+ {"train_loss": 5.0515888200687185, "train_lr": 0.0015284862046610389, "train_wd": 0.163704851564621, "epoch": 159}
161
+ {"train_loss": 5.052292874146946, "train_lr": 0.0015200166390906724, "train_wd": 0.16504936809884233, "epoch": 160}
162
+ {"train_loss": 5.052882967306841, "train_lr": 0.0015115214739009571, "train_wd": 0.16639727424688008, "epoch": 161}
163
+ {"train_loss": 5.053132421172542, "train_lr": 0.0015030012603309917, "train_wd": 0.16774848686353355, "epoch": 162}
164
+ {"train_loss": 5.056654157720024, "train_lr": 0.0014944565512452252, "train_wd": 0.16910292259964443, "epoch": 163}
165
+ {"train_loss": 5.0565715535319775, "train_lr": 0.001485887901097584, "train_wd": 0.17046049790723505, "epoch": 164}
166
+ {"train_loss": 5.057663604891081, "train_lr": 0.0014772958658954961, "train_wd": 0.1718211290446672, "epoch": 165}
167
+ {"train_loss": 5.058639786500248, "train_lr": 0.0014686810031638103, "train_wd": 0.17318473208180246, "epoch": 166}
168
+ {"train_loss": 5.059489585727238, "train_lr": 0.0014600438719086313, "train_wd": 0.17455122290518255, "epoch": 167}
169
+ {"train_loss": 5.059578287468064, "train_lr": 0.001451385032581021, "train_wd": 0.17592051722321678, "epoch": 168}
170
+ {"train_loss": 5.062086945338596, "train_lr": 0.001442705047040657, "train_wd": 0.17729253057138175, "epoch": 169}
171
+ {"train_loss": 5.061082455644504, "train_lr": 0.0014340044785193695, "train_wd": 0.1786671783174312, "epoch": 170}
172
+ {"train_loss": 5.062198684840418, "train_lr": 0.0014252838915845686, "train_wd": 0.1800443756666165, "epoch": 171}
173
+ {"train_loss": 5.063558317357592, "train_lr": 0.0014165438521026492, "train_wd": 0.1814240376669191, "epoch": 172}
174
+ {"train_loss": 5.066216586567134, "train_lr": 0.0014077849272022555, "train_wd": 0.18280607921428652, "epoch": 173}
175
+ {"train_loss": 5.066024520932484, "train_lr": 0.00139900768523746, "train_wd": 0.18419041505788783, "epoch": 174}
176
+ {"train_loss": 5.064372020582263, "train_lr": 0.0013902126957509246, "train_wd": 0.18557695980536645, "epoch": 175}
177
+ {"train_loss": 5.064834684389624, "train_lr": 0.0013814005294369043, "train_wd": 0.186965627928111, "epoch": 176}
178
+ {"train_loss": 5.064027204936881, "train_lr": 0.0013725717581042547, "train_wd": 0.18835633376653085, "epoch": 177}
179
+ {"train_loss": 5.064920329313865, "train_lr": 0.0013637269546392867, "train_wd": 0.18974899153533897, "epoch": 178}
180
+ {"train_loss": 5.068584239698476, "train_lr": 0.0013548666929686277, "train_wd": 0.19114351532884466, "epoch": 179}
181
+ {"train_loss": 5.062858798544851, "train_lr": 0.001345991548021954, "train_wd": 0.1925398191262502, "epoch": 180}
182
+ {"train_loss": 5.063442324360402, "train_lr": 0.0013371020956947025, "train_wd": 0.19393781679696118, "epoch": 181}
183
+ {"train_loss": 5.063762116906264, "train_lr": 0.0013281989128107092, "train_wd": 0.1953374221058965, "epoch": 182}
184
+ {"train_loss": 5.0623575256084745, "train_lr": 0.0013192825770847309, "train_wd": 0.196738548718807, "epoch": 183}
185
+ {"train_loss": 5.063648986409036, "train_lr": 0.0013103536670850343, "train_wd": 0.19814111020760444, "epoch": 184}
186
+ {"train_loss": 5.064735740179019, "train_lr": 0.0013014127621957833, "train_wd": 0.19954502005568794, "epoch": 185}
187
+ {"train_loss": 5.063962829675225, "train_lr": 0.0012924604425794894, "train_wd": 0.20095019166328626, "epoch": 186}
188
+ {"train_loss": 5.063437647027649, "train_lr": 0.0012834972891393362, "train_wd": 0.2023565383527955, "epoch": 187}
189
+ {"train_loss": 5.0641190597622225, "train_lr": 0.0012745238834815133, "train_wd": 0.203763973374127, "epoch": 188}
190
+ {"train_loss": 5.063902675587354, "train_lr": 0.0012655408078774484, "train_wd": 0.2051724099100601, "epoch": 189}
191
+ {"train_loss": 5.065132150433952, "train_lr": 0.0012565486452260468, "train_wd": 0.20658176108159315, "epoch": 190}
192
+ {"train_loss": 5.065777538324908, "train_lr": 0.0012475479790158568, "train_wd": 0.2079919399533085, "epoch": 191}
193
+ {"train_loss": 5.064099990599733, "train_lr": 0.0012385393932872097, "train_wd": 0.2094028595387305, "epoch": 192}
194
+ {"train_loss": 5.063579307620426, "train_lr": 0.0012295234725943252, "train_wd": 0.21081443280569376, "epoch": 193}
195
+ {"train_loss": 5.061584196168837, "train_lr": 0.0012205008019673723, "train_wd": 0.21222657268170894, "epoch": 194}
196
+ {"train_loss": 5.062155795647658, "train_lr": 0.0012114719668745244, "train_wd": 0.2136391920593371, "epoch": 195}
197
+ {"train_loss": 5.062742229440897, "train_lr": 0.0012024375531839476, "train_wd": 0.21505220380156154, "epoch": 196}
198
+ {"train_loss": 5.060796733960498, "train_lr": 0.0011933981471258025, "train_wd": 0.21646552074716072, "epoch": 197}
199
+ {"train_loss": 5.061077989554472, "train_lr": 0.0011843543352541884, "train_wd": 0.2178790557160903, "epoch": 198}
200
+ {"train_loss": 5.060440116827722, "train_lr": 0.0011753067044091045, "train_wd": 0.219292721514853, "epoch": 199}
201
+ {"train_loss": 5.059170163709292, "train_lr": 0.0011662558416783448, "train_wd": 0.22070643094188536, "epoch": 200}
202
+ {"train_loss": 5.0590799166608775, "train_lr": 0.0011572023343594264, "train_wd": 0.22212009679292866, "epoch": 201}
203
+ {"train_loss": 5.057440980208768, "train_lr": 0.0011481467699214608, "train_wd": 0.22353363186641545, "epoch": 202}
204
+ {"train_loss": 5.057461818553609, "train_lr": 0.0011390897359670493, "train_wd": 0.22494694896884398, "epoch": 203}
205
+ {"train_loss": 5.054592366460606, "train_lr": 0.0011300318201941445, "train_wd": 0.2263599609201577, "epoch": 204}
206
+ {"train_loss": 5.0537276357817325, "train_lr": 0.001120973610357927, "train_wd": 0.22777258055912372, "epoch": 205}
207
+ {"train_loss": 5.0514625969896025, "train_lr": 0.0011119156942326432, "train_wd": 0.2291847207487093, "epoch": 206}
208
+ {"train_loss": 5.0508974054031714, "train_lr": 0.0011028586595734913, "train_wd": 0.23059629438145465, "epoch": 207}
209
+ {"train_loss": 5.047175745514752, "train_lr": 0.0010938030940784746, "train_wd": 0.2320072143848498, "epoch": 208}
210
+ {"train_loss": 5.046830037836548, "train_lr": 0.0010847495853502605, "train_wd": 0.23341739372670214, "epoch": 209}
211
+ {"train_loss": 5.046326884763133, "train_lr": 0.0010756987208580574, "train_wd": 0.23482674542050871, "epoch": 210}
212
+ {"train_loss": 5.047194545241378, "train_lr": 0.0010666510878994864, "train_wd": 0.2362351825308164, "epoch": 211}
213
+ {"train_loss": 5.040715190241758, "train_lr": 0.0010576072735624896, "train_wd": 0.23764261817859192, "epoch": 212}
214
+ {"train_loss": 5.040514496036714, "train_lr": 0.0010485678646872164, "train_wd": 0.23904896554657432, "epoch": 213}
215
+ {"train_loss": 5.036664680468379, "train_lr": 0.0010395334478279575, "train_wd": 0.24045413788463224, "epoch": 214}
216
+ {"train_loss": 5.0360095577953246, "train_lr": 0.001030504609215075, "train_wd": 0.2418580485151181, "epoch": 215}
217
+ {"train_loss": 5.034671847697356, "train_lr": 0.0010214819347169625, "train_wd": 0.2432606108382111, "epoch": 216}
218
+ {"train_loss": 5.031384058749314, "train_lr": 0.0010124660098020438, "train_wd": 0.2446617383372606, "epoch": 217}
219
+ {"train_loss": 5.029689934185083, "train_lr": 0.0010034574195007656, "train_wd": 0.246061344584122, "epoch": 218}
220
+ {"train_loss": 5.027825422388473, "train_lr": 0.0009944567483676431, "train_wd": 0.24745934324448998, "epoch": 219}
221
+ {"train_loss": 5.024332265261647, "train_lr": 0.000985464580443327, "train_wd": 0.2488556480832213, "epoch": 220}
222
+ {"train_loss": 5.023203111928907, "train_lr": 0.0009764814992167072, "train_wd": 0.250250172969656, "epoch": 221}
223
+ {"train_loss": 5.020969932283953, "train_lr": 0.0009675080875870501, "train_wd": 0.25164283188293163, "epoch": 222}
224
+ {"train_loss": 5.017743961863237, "train_lr": 0.0009585449278261788, "train_wd": 0.2530335389172849, "epoch": 223}
225
+ {"train_loss": 5.01558007916315, "train_lr": 0.0009495926015406867, "train_wd": 0.2544222082873567, "epoch": 224}
226
+ {"train_loss": 5.008099335727455, "train_lr": 0.0009406516896341935, "train_wd": 0.2558087543334778, "epoch": 225}
227
+ {"train_loss": 5.007489387478998, "train_lr": 0.0009317227722696614, "train_wd": 0.25719309152695813, "epoch": 226}
228
+ {"train_loss": 5.00511942087389, "train_lr": 0.000922806428831744, "train_wd": 0.2585751344753574, "epoch": 227}
229
+ {"train_loss": 5.003316748395955, "train_lr": 0.000913903237889186, "train_wd": 0.2599547979277569, "epoch": 228}
230
+ {"train_loss": 5.00074020510526, "train_lr": 0.0009050137771572951, "train_wd": 0.2613319967800164, "epoch": 229}
231
+ {"train_loss": 4.996222538717216, "train_lr": 0.000896138623460436, "train_wd": 0.26270664608002364, "epoch": 230}
232
+ {"train_loss": 4.994506737745875, "train_lr": 0.0008872783526946113, "train_wd": 0.26407866103293454, "epoch": 231}
233
+ {"train_loss": 4.992520922802383, "train_lr": 0.0008784335397900937, "train_wd": 0.2654479570064033, "epoch": 232}
234
+ {"train_loss": 4.988456529149001, "train_lr": 0.0008696047586741224, "train_wd": 0.2668144495358054, "epoch": 233}
235
+ {"train_loss": 4.986210458754874, "train_lr": 0.0008607925822336454, "train_wd": 0.2681780543294442, "epoch": 234}
236
+ {"train_loss": 4.982131213503633, "train_lr": 0.0008519975822781682, "train_wd": 0.269538687273754, "epoch": 235}
237
+ {"train_loss": 4.980333292792789, "train_lr": 0.0008432203295026338, "train_wd": 0.27089626443848336, "epoch": 236}
238
+ {"train_loss": 4.975452028703299, "train_lr": 0.0008344613934503925, "train_wd": 0.27225070208187957, "epoch": 237}
239
+ {"train_loss": 4.971105074371509, "train_lr": 0.0008257213424762576, "train_wd": 0.27360191665584904, "epoch": 238}
240
+ {"train_loss": 4.968936504166332, "train_lr": 0.0008170007437096112, "train_wd": 0.2749498248111106, "epoch": 239}
241
+ {"train_loss": 4.9655094626996155, "train_lr": 0.0008083001630176061, "train_wd": 0.2762943434023426, "epoch": 240}
242
+ {"train_loss": 4.961010154542163, "train_lr": 0.0007996201649684595, "train_wd": 0.277635389493303, "epoch": 241}
243
+ {"train_loss": 4.957728406007913, "train_lr": 0.0007909613127948033, "train_wd": 0.2789728803619521, "epoch": 242}
244
+ {"train_loss": 4.953317111737722, "train_lr": 0.0007823241683571459, "train_wd": 0.2803067335055533, "epoch": 243}
245
+ {"train_loss": 4.948795519876394, "train_lr": 0.0007737092921074157, "train_wd": 0.28163686664576215, "epoch": 244}
246
+ {"train_loss": 4.945552291141616, "train_lr": 0.0007651172430525858, "train_wd": 0.2829631977337003, "epoch": 245}
247
+ {"train_loss": 4.94089244935605, "train_lr": 0.0007565485787184022, "train_wd": 0.284285644955019, "epoch": 246}
248
+ {"train_loss": 4.935349420570641, "train_lr": 0.0007480038551132194, "train_wd": 0.2856041267349452, "epoch": 247}
249
+ {"train_loss": 4.931657168153617, "train_lr": 0.000739483626691908, "train_wd": 0.28691856174331076, "epoch": 248}
250
+ {"train_loss": 4.925338470261637, "train_lr": 0.0007309884463198738, "train_wd": 0.28822886889957433, "epoch": 249}
251
+ {"train_loss": 4.922023578007206, "train_lr": 0.0007225188652372023, "train_wd": 0.2895349673778164, "epoch": 250}
252
+ {"train_loss": 4.917414636283422, "train_lr": 0.0007140754330228696, "train_wd": 0.2908367766117324, "epoch": 251}
253
+ {"train_loss": 4.912831997145995, "train_lr": 0.0007056586975590948, "train_wd": 0.2921342162995959, "epoch": 252}
254
+ {"train_loss": 4.907177175936415, "train_lr": 0.0006972692049957806, "train_wd": 0.2934272064092154, "epoch": 253}
255
+ {"train_loss": 4.904839147844141, "train_lr": 0.0006889074997150731, "train_wd": 0.2947156671828704, "epoch": 254}
256
+ {"train_loss": 4.8981898162338275, "train_lr": 0.00068057412429605, "train_wd": 0.29599951914223155, "epoch": 255}
257
+ {"train_loss": 4.894370648036186, "train_lr": 0.0006722696194794978, "train_wd": 0.2972786830932622, "epoch": 256}
258
+ {"train_loss": 4.8881712039109235, "train_lr": 0.000663994524132831, "train_wd": 0.29855308013110454, "epoch": 257}
259
+ {"train_loss": 4.884381202234924, "train_lr": 0.0006557493752151325, "train_wd": 0.29982263164494594, "epoch": 258}
260
+ {"train_loss": 4.880416413046997, "train_lr": 0.0006475347077422958, "train_wd": 0.30108725932287034, "epoch": 259}
261
+ {"train_loss": 4.875331898685173, "train_lr": 0.0006393510547523213, "train_wd": 0.3023468851566843, "epoch": 260}
262
+ {"train_loss": 4.867493334320857, "train_lr": 0.0006311989472707278, "train_wd": 0.30360143144673274, "epoch": 261}
263
+ {"train_loss": 4.863474253675253, "train_lr": 0.000623078914276085, "train_wd": 0.3048508208066917, "epoch": 262}
264
+ {"train_loss": 4.858651462290212, "train_lr": 0.0006149914826656965, "train_wd": 0.3060949761683405, "epoch": 263}
265
+ {"train_loss": 4.853368350290518, "train_lr": 0.0006069371772214114, "train_wd": 0.3073338207863162, "epoch": 264}
266
+ {"train_loss": 4.84878363189318, "train_lr": 0.0005989165205755661, "train_wd": 0.30856727824284547, "epoch": 265}
267
+ {"train_loss": 4.843794696646438, "train_lr": 0.000590930033177077, "train_wd": 0.3097952724524647, "epoch": 266}
268
+ {"train_loss": 4.837881371331253, "train_lr": 0.0005829782332576656, "train_wd": 0.31101772766670555, "epoch": 267}
269
+ {"train_loss": 4.833974913233142, "train_lr": 0.0005750616367982363, "train_wd": 0.3122345684787717, "epoch": 268}
270
+ {"train_loss": 4.82714938720782, "train_lr": 0.0005671807574953849, "train_wd": 0.3134457198281908, "epoch": 269}
271
+ {"train_loss": 4.820540842201879, "train_lr": 0.000559336106728078, "train_wd": 0.31465110700544185, "epoch": 270}
272
+ {"train_loss": 4.814345674453784, "train_lr": 0.0005515281935244598, "train_wd": 0.3158506556565671, "epoch": 271}
273
+ {"train_loss": 4.80803205215221, "train_lr": 0.0005437575245288296, "train_wd": 0.3170442917877532, "epoch": 272}
274
+ {"train_loss": 4.800921055785329, "train_lr": 0.0005360246039687654, "train_wd": 0.318231941769903, "epoch": 273}
275
+ {"train_loss": 4.797511439154045, "train_lr": 0.0005283299336223971, "train_wd": 0.3194135323431709, "epoch": 274}
276
+ {"train_loss": 4.790865347110968, "train_lr": 0.0005206740127858584, "train_wd": 0.3205889906214848, "epoch": 275}
277
+ {"train_loss": 4.785187482595634, "train_lr": 0.0005130573382408798, "train_wd": 0.32175824409704, "epoch": 276}
278
+ {"train_loss": 4.777992897748137, "train_lr": 0.0005054804042225596, "train_wd": 0.3229212206447756, "epoch": 277}
279
+ {"train_loss": 4.771080911993313, "train_lr": 0.0004979437023872868, "train_wd": 0.32407784852681937, "epoch": 278}
280
+ {"train_loss": 4.7652488085780025, "train_lr": 0.0004904477217808411, "train_wd": 0.3252280563969152, "epoch": 279}
281
+ {"train_loss": 4.760241817239282, "train_lr": 0.00048299294880666595, "train_wd": 0.32637177330482514, "epoch": 280}
282
+ {"train_loss": 4.752522000442926, "train_lr": 0.00047557986719429327, "train_wd": 0.32750892870070053, "epoch": 281}
283
+ {"train_loss": 4.747531998059828, "train_lr": 0.0004682089579679648, "train_wd": 0.3286394524394421, "epoch": 282}
284
+ {"train_loss": 4.7417209265317375, "train_lr": 0.00046088069941542097, "train_wd": 0.32976327478502, "epoch": 283}
285
+ {"train_loss": 4.735434948135432, "train_lr": 0.0004535955670568559, "train_wd": 0.3308803264147775, "epoch": 284}
286
+ {"train_loss": 4.728086945583685, "train_lr": 0.0004463540336140675, "train_wd": 0.33199053842370807, "epoch": 285}
287
+ {"train_loss": 4.7221498096184575, "train_lr": 0.0004391565689797834, "train_wd": 0.3330938423287066, "epoch": 286}
288
+ {"train_loss": 4.7145808008339385, "train_lr": 0.00043200364018716904, "train_wd": 0.334190170072791, "epoch": 287}
289
+ {"train_loss": 4.708020688645798, "train_lr": 0.0004248957113795247, "train_wd": 0.33527945402930165, "epoch": 288}
290
+ {"train_loss": 4.701343006903319, "train_lr": 0.00041783324378016364, "train_wd": 0.33636162700607314, "epoch": 289}
291
+ {"train_loss": 4.69468024152098, "train_lr": 0.00041081669566248795, "train_wd": 0.33743662224957915, "epoch": 290}
292
+ {"train_loss": 4.685200823141898, "train_lr": 0.00040384652232024974, "train_wd": 0.33850437344904766, "epoch": 291}
293
+ {"train_loss": 4.678547248387223, "train_lr": 0.00039692317603800767, "train_wd": 0.3395648147405573, "epoch": 292}
294
+ {"train_loss": 4.670517399704618, "train_lr": 0.0003900471060617836, "train_wd": 0.3406178807110933, "epoch": 293}
295
+ {"train_loss": 4.662524536359224, "train_lr": 0.0003832187585698995, "train_wd": 0.3416635064025855, "epoch": 294}
296
+ {"train_loss": 4.654399912860944, "train_lr": 0.000376438576644043, "train_wd": 0.3427016273159168, "epoch": 295}
297
+ {"train_loss": 4.6471501504607815, "train_lr": 0.00036970700024050064, "train_wd": 0.3437321794148987, "epoch": 296}
298
+ {"train_loss": 4.638612014468578, "train_lr": 0.00036302446616161873, "train_wd": 0.3447550991302242, "epoch": 297}
299
+ {"train_loss": 4.631100932262736, "train_lr": 0.0003563914080274577, "train_wd": 0.3457703233633857, "epoch": 298}
300
+ {"train_loss": 4.623134244629424, "train_lr": 0.00034980825624765456, "train_wd": 0.3467777894905715, "epoch": 299}
301
+ {"train_loss": 4.615148453886132, "train_lr": 0.0003432754379934938, "train_wd": 0.34777743536652517, "epoch": 300}
302
+ {"train_loss": 4.606329397522479, "train_lr": 0.00033679337717018934, "train_wd": 0.34876919932837885, "epoch": 301}
303
+ {"train_loss": 4.599237131653167, "train_lr": 0.000330362494389381, "train_wd": 0.3497530201994611, "epoch": 302}
304
+ {"train_loss": 4.59081717819976, "train_lr": 0.000323983206941835, "train_wd": 0.35072883729306636, "epoch": 303}
305
+ {"train_loss": 4.582908008977187, "train_lr": 0.00031765592877037253, "train_wd": 0.35169659041620094, "epoch": 304}
306
+ {"train_loss": 4.5733358861564355, "train_lr": 0.0003113810704430055, "train_wd": 0.3526562198732908, "epoch": 305}
307
+ {"train_loss": 4.564309866087948, "train_lr": 0.0003051590391262999, "train_wd": 0.3536076664698735, "epoch": 306}
308
+ {"train_loss": 4.555662704767179, "train_lr": 0.0002989902385589515, "train_wd": 0.3545508715162375, "epoch": 307}
309
+ {"train_loss": 4.54760512836474, "train_lr": 0.00029287506902558793, "train_wd": 0.3554857768310568, "epoch": 308}
310
+ {"train_loss": 4.53756690811482, "train_lr": 0.000286813927330797, "train_wd": 0.3564123247449674, "epoch": 309}
311
+ {"train_loss": 4.529608110807163, "train_lr": 0.00028080720677337815, "train_wd": 0.3573304581041274, "epoch": 310}
312
+ {"train_loss": 4.5196145807238794, "train_lr": 0.00027485529712081977, "train_wd": 0.3582401202737472, "epoch": 311}
313
+ {"train_loss": 4.509118945954992, "train_lr": 0.0002689585845840098, "train_wd": 0.3591412551415791, "epoch": 312}
314
+ {"train_loss": 4.502537519132776, "train_lr": 0.0002631174517921747, "train_wd": 0.36003380712137945, "epoch": 313}
315
+ {"train_loss": 4.492621650977386, "train_lr": 0.00025733227776804986, "train_wd": 0.3609177211563397, "epoch": 314}
316
+ {"train_loss": 4.482963060857438, "train_lr": 0.0002516034379032888, "train_wd": 0.3617929427224776, "epoch": 315}
317
+ {"train_loss": 4.475395755706836, "train_lr": 0.00024593130393409855, "train_wd": 0.3626594178320025, "epoch": 316}
318
+ {"train_loss": 4.463723065374757, "train_lr": 0.00024031624391712564, "train_wd": 0.36351709303664975, "epoch": 317}
319
+ {"train_loss": 4.4534207991511225, "train_lr": 0.00023475862220556713, "train_wd": 0.3643659154309737, "epoch": 318}
320
+ {"train_loss": 4.443745340702297, "train_lr": 0.00022925879942553156, "train_wd": 0.365205832655609, "epoch": 319}
321
+ {"train_loss": 4.434112533426685, "train_lr": 0.00022381713245263766, "train_wd": 0.36603679290050706, "epoch": 320}
322
+ {"train_loss": 4.423886619133057, "train_lr": 0.00021843397438885736, "train_wd": 0.36685874490812154, "epoch": 321}
323
+ {"train_loss": 4.412763283365398, "train_lr": 0.0002131096745396021, "train_wd": 0.3676716379765859, "epoch": 322}
324
+ {"train_loss": 4.401639608509964, "train_lr": 0.00020784457839105946, "train_wd": 0.36847542196282307, "epoch": 323}
325
+ {"train_loss": 4.390171518541878, "train_lr": 0.00020263902758777447, "train_wd": 0.369270047285652, "epoch": 324}
326
+ {"train_loss": 4.379141875975233, "train_lr": 0.00019749335991047762, "train_wd": 0.37005546492884, "epoch": 325}
327
+ {"train_loss": 4.368495727936141, "train_lr": 0.00019240790925417048, "train_wd": 0.37083162644412637, "epoch": 326}
328
+ {"train_loss": 4.357273751126824, "train_lr": 0.00018738300560645915, "train_wd": 0.3715984839542151, "epoch": 327}
329
+ {"train_loss": 4.346397876596565, "train_lr": 0.0001824189750261398, "train_wd": 0.3723559901557198, "epoch": 328}
330
+ {"train_loss": 4.33588796622938, "train_lr": 0.00017751613962204397, "train_wd": 0.3731040983220901, "epoch": 329}
331
+ {"train_loss": 4.3238908172511366, "train_lr": 0.00017267481753213337, "train_wd": 0.37384276230649194, "epoch": 330}
332
+ {"train_loss": 4.312422900760679, "train_lr": 0.0001678953229028614, "train_wd": 0.3745719365446499, "epoch": 331}
333
+ {"train_loss": 4.300488709242081, "train_lr": 0.0001631779658687858, "train_wd": 0.3752915760576642, "epoch": 332}
334
+ {"train_loss": 4.288683925547617, "train_lr": 0.00015852305253244374, "train_wd": 0.3760016364547775, "epoch": 333}
335
+ {"train_loss": 4.276059366786461, "train_lr": 0.0001539308849444909, "train_wd": 0.37670207393612165, "epoch": 334}
336
+ {"train_loss": 4.264887864337408, "train_lr": 0.0001494017610841008, "train_wd": 0.3773928452954123, "epoch": 335}
337
+ {"train_loss": 4.251469054620424, "train_lr": 0.00014493597483963136, "train_wd": 0.3780739079226194, "epoch": 336}
338
+ {"train_loss": 4.239295731387217, "train_lr": 0.00014053381598955113, "train_wd": 0.3787452198065901, "epoch": 337}
339
+ {"train_loss": 4.225657296415379, "train_lr": 0.0001361955701836397, "train_wd": 0.37940673953764753, "epoch": 338}
340
+ {"train_loss": 4.213763868440684, "train_lr": 0.0001319215189244515, "train_wd": 0.3800584263101365, "epoch": 339}
341
+ {"train_loss": 4.200215282962382, "train_lr": 0.00012771193954904587, "train_wd": 0.38070023992494867, "epoch": 340}
342
+ {"train_loss": 4.187662810569615, "train_lr": 0.0001235671052109971, "train_wd": 0.38133214079199634, "epoch": 341}
343
+ {"train_loss": 4.175019946946896, "train_lr": 0.00011948728486266541, "train_wd": 0.38195408993265745, "epoch": 342}
344
+ {"train_loss": 4.162678389091619, "train_lr": 0.00011547274323774695, "train_wd": 0.38256604898217966, "epoch": 343}
345
+ {"train_loss": 4.147709864530442, "train_lr": 0.00011152374083409392, "train_wd": 0.38316798019204706, "epoch": 344}
346
+ {"train_loss": 4.1348062732475075, "train_lr": 0.00010764053389681373, "train_wd": 0.3837598464323059, "epoch": 345}
347
+ {"train_loss": 4.121832250458874, "train_lr": 0.00010382337440163965, "train_wd": 0.38434161119385885, "epoch": 346}
348
+ {"train_loss": 4.108135711708419, "train_lr": 0.00010007251003858072, "train_wd": 0.38491323859071513, "epoch": 347}
349
+ {"train_loss": 4.093841604453673, "train_lr": 9.638818419585105e-05, "train_wd": 0.3854746933622053, "epoch": 348}
350
+ {"train_loss": 4.078653924607878, "train_lr": 9.277063594407402e-05, "train_wd": 0.38602594087515296, "epoch": 349}
351
+ {"train_loss": 4.065404155616947, "train_lr": 8.922010002077167e-05, "train_wd": 0.38656694712601525, "epoch": 350}
352
+ {"train_loss": 4.052191693106477, "train_lr": 8.573680681513209e-05, "train_wd": 0.3870976787429777, "epoch": 351}
353
+ {"train_loss": 4.03811537301083, "train_lr": 8.232098235305936e-05, "train_wd": 0.38761810298801663, "epoch": 352}
354
+ {"train_loss": 4.023593600788753, "train_lr": 7.897284828250804e-05, "train_wd": 0.3881281877589109, "epoch": 353}
355
+ {"train_loss": 4.0070806405574775, "train_lr": 7.569262185910003e-05, "train_wd": 0.3886279015912286, "epoch": 354}
356
+ {"train_loss": 3.9945585182149537, "train_lr": 7.248051593202686e-05, "train_wd": 0.38911721366026947, "epoch": 355}
357
+ {"train_loss": 3.9797920682828583, "train_lr": 6.933673893023928e-05, "train_wd": 0.3895960937829577, "epoch": 356}
358
+ {"train_loss": 3.9654532474019737, "train_lr": 6.626149484892149e-05, "train_wd": 0.3900645124197119, "epoch": 357}
359
+ {"train_loss": 3.951138318031669, "train_lr": 6.325498323625508e-05, "train_wd": 0.39052244067626624, "epoch": 358}
360
+ {"train_loss": 3.935840425945872, "train_lr": 6.031739918047009e-05, "train_wd": 0.39096985030544645, "epoch": 359}
361
+ {"train_loss": 3.921667525319935, "train_lr": 5.74489332971862e-05, "train_wd": 0.3914067137089192, "epoch": 360}
362
+ {"train_loss": 3.9084897777564422, "train_lr": 5.464977171704377e-05, "train_wd": 0.39183300393889414, "epoch": 361}
363
+ {"train_loss": 3.8933815875118203, "train_lr": 5.19200960736264e-05, "train_wd": 0.39224869469977885, "epoch": 362}
364
+ {"train_loss": 3.8777786941408254, "train_lr": 4.9260083491675006e-05, "train_wd": 0.3926537603498122, "epoch": 363}
365
+ {"train_loss": 3.8640478378553373, "train_lr": 4.666990657559381e-05, "train_wd": 0.3930481759026342, "epoch": 364}
366
+ {"train_loss": 3.849154220383278, "train_lr": 4.414973339825131e-05, "train_wd": 0.3934319170288371, "epoch": 365}
367
+ {"train_loss": 3.83686304494417, "train_lr": 4.16997274900732e-05, "train_wd": 0.3938049600574607, "epoch": 366}
368
+ {"train_loss": 3.821596854912053, "train_lr": 3.9320047828431966e-05, "train_wd": 0.394167281977453, "epoch": 367}
369
+ {"train_loss": 3.8074215755081005, "train_lr": 3.7010848827330696e-05, "train_wd": 0.3945188604390926, "epoch": 368}
370
+ {"train_loss": 3.794100793985297, "train_lr": 3.477228032738327e-05, "train_wd": 0.394859673755362, "epoch": 369}
371
+ {"train_loss": 3.780965423138498, "train_lr": 3.26044875860917e-05, "train_wd": 0.3951897009032925, "epoch": 370}
372
+ {"train_loss": 3.767160097204095, "train_lr": 3.0507611268420424e-05, "train_wd": 0.3955089215252535, "epoch": 371}
373
+ {"train_loss": 3.754950592462584, "train_lr": 2.848178743766871e-05, "train_wd": 0.39581731593021396, "epoch": 372}
374
+ {"train_loss": 3.7406982700589846, "train_lr": 2.652714754664177e-05, "train_wd": 0.39611486509495486, "epoch": 373}
375
+ {"train_loss": 3.729427683172371, "train_lr": 2.4643818429121177e-05, "train_wd": 0.39640155066524146, "epoch": 374}
376
+ {"train_loss": 3.7165080270023463, "train_lr": 2.283192229163428e-05, "train_wd": 0.3966773549569573, "epoch": 375}
377
+ {"train_loss": 3.7044468289501755, "train_lr": 2.1091576705524968e-05, "train_wd": 0.3969422609571956, "epoch": 376}
378
+ {"train_loss": 3.6929199265347394, "train_lr": 1.942289459932436e-05, "train_wd": 0.3971962523253041, "epoch": 377}
379
+ {"train_loss": 3.6810429938655678, "train_lr": 1.782598425142293e-05, "train_wd": 0.3974393133939014, "epoch": 378}
380
+ {"train_loss": 3.6709727578514295, "train_lr": 1.630094928304469e-05, "train_wd": 0.39767142916983467, "epoch": 379}
381
+ {"train_loss": 3.6602019294262598, "train_lr": 1.4847888651523358e-05, "train_wd": 0.3978925853351094, "epoch": 380}
382
+ {"train_loss": 3.649509161853676, "train_lr": 1.346689664388093e-05, "train_wd": 0.39810276824777074, "epoch": 381}
383
+ {"train_loss": 3.640537181578809, "train_lr": 1.2158062870709786e-05, "train_wd": 0.39830196494274944, "epoch": 382}
384
+ {"train_loss": 3.631285222439314, "train_lr": 1.0921472260357805e-05, "train_wd": 0.39849016313265234, "epoch": 383}
385
+ {"train_loss": 3.6212902165216794, "train_lr": 9.7572050534176e-06, "train_wd": 0.39866735120852914, "epoch": 384}
386
+ {"train_loss": 3.6128972267730535, "train_lr": 8.665336797519755e-06, "train_wd": 0.3988335182405865, "epoch": 385}
387
+ {"train_loss": 3.606880258831332, "train_lr": 7.64593834243072e-06, "train_wd": 0.3989886539788556, "epoch": 386}
388
+ {"train_loss": 3.5982171260028912, "train_lr": 6.699075835455352e-06, "train_wd": 0.3991327488538374, "epoch": 387}
389
+ {"train_loss": 3.591992610947882, "train_lr": 5.82481071714485e-06, "train_wd": 0.3992657939770773, "epoch": 388}
390
+ {"train_loss": 3.585490051564648, "train_lr": 5.023199717309857e-06, "train_wd": 0.3993877811417291, "epoch": 389}
391
+ {"train_loss": 3.580611295039229, "train_lr": 4.294294851339406e-06, "train_wd": 0.3994987028230467, "epoch": 390}
392
+ {"train_loss": 3.5747398439702467, "train_lr": 3.6381434168256834e-06, "train_wd": 0.3995985521788607, "epoch": 391}
393
+ {"train_loss": 3.5716226860392486, "train_lr": 3.0547879904949834e-06, "train_wd": 0.39968732304999155, "epoch": 392}
394
+ {"train_loss": 3.567668136974557, "train_lr": 2.5442664254449134e-06, "train_wd": 0.3997650099606345, "epoch": 393}
395
+ {"train_loss": 3.564820939110671, "train_lr": 2.1066118486882486e-06, "train_wd": 0.3998316081186933, "epoch": 394}
396
+ {"train_loss": 3.5610559352284237, "train_lr": 1.741852659003286e-06, "train_wd": 0.3998871134160813, "epoch": 395}
397
+ {"train_loss": 3.5592307050665504, "train_lr": 1.45001252509112e-06, "train_wd": 0.39993152242896945, "epoch": 396}
398
+ {"train_loss": 3.55706747188914, "train_lr": 1.2311103840398177e-06, "train_wd": 0.3999648324180009, "epoch": 397}
399
+ {"train_loss": 3.5563410500780663, "train_lr": 1.0851604400956189e-06, "train_wd": 0.39998704132845964, "epoch": 398}
400
+ {"train_loss": 3.5548059027031553, "train_lr": 1.012172163741218e-06, "train_wd": 0.3999981477903932, "epoch": 399}
Vim/Base/log_eval.txt ADDED
@@ -0,0 +1,100 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"train_lr": 0.0019999999999998686, "train_loss": 1.40141621739851, "epoch": 0, "test_loss": 0.9865021037552363, "test_acc1": 75.178, "test_acc5": 92.982}
2
+ {"train_lr": 0.0019995065603657376, "train_loss": 1.0348678242431562, "epoch": 1, "test_loss": 0.9310997676513993, "test_acc1": 76.474, "test_acc5": 93.7}
3
+ {"train_lr": 0.0019980267284282105, "train_loss": 0.9869975087627667, "epoch": 2, "test_loss": 0.9145035531057422, "test_acc1": 76.83, "test_acc5": 93.972}
4
+ {"train_lr": 0.001995561964603092, "train_loss": 0.9697637621475561, "epoch": 3, "test_loss": 0.909291505851709, "test_acc1": 76.958, "test_acc5": 93.968}
5
+ {"train_lr": 0.0019921147013145773, "train_loss": 0.9620687462660346, "epoch": 4, "test_loss": 0.9025258075283922, "test_acc1": 77.164, "test_acc5": 94.022}
6
+ {"train_lr": 0.0019876883405950175, "train_loss": 0.9578788713591126, "epoch": 5, "test_loss": 0.901965103376552, "test_acc1": 77.208, "test_acc5": 94.144}
7
+ {"train_lr": 0.0019822872507288198, "train_loss": 0.9580256745570477, "epoch": 6, "test_loss": 0.9055825617269176, "test_acc1": 77.122, "test_acc5": 93.974}
8
+ {"train_lr": 0.0019759167619387524, "train_loss": 0.9558512604253272, "epoch": 7, "test_loss": 0.9059519183147898, "test_acc1": 77.144, "test_acc5": 94.052}
9
+ {"train_lr": 0.001968583161128624, "train_loss": 0.9566828705909202, "epoch": 8, "test_loss": 0.9028019275506745, "test_acc1": 76.944, "test_acc5": 94.07}
10
+ {"train_lr": 0.001960293685677003, "train_loss": 0.956073425388722, "epoch": 9, "test_loss": 0.9031169299617448, "test_acc1": 77.144, "test_acc5": 94.112}
11
+ {"train_lr": 0.0019510565162951365, "train_loss": 0.9550017401474836, "epoch": 10, "test_loss": 0.905227641277301, "test_acc1": 77.096, "test_acc5": 94.036}
12
+ {"train_lr": 0.0019408807689541316, "train_loss": 0.955112198264276, "epoch": 11, "test_loss": 0.9057276449773622, "test_acc1": 76.96, "test_acc5": 94.116}
13
+ {"train_lr": 0.0019297764858882515, "train_loss": 0.9544162914377187, "epoch": 12, "test_loss": 0.8991024241499279, "test_acc1": 77.182, "test_acc5": 94.07}
14
+ {"train_lr": 0.0019177546256839834, "train_loss": 0.9518558204388361, "epoch": 13, "test_loss": 0.9029132409207047, "test_acc1": 77.148, "test_acc5": 94.106}
15
+ {"train_lr": 0.0019048270524661083, "train_loss": 0.9521451800722291, "epoch": 14, "test_loss": 0.9020788964560574, "test_acc1": 77.166, "test_acc5": 94.098}
16
+ {"train_lr": 0.0018910065241883177, "train_loss": 0.9519058762016269, "epoch": 15, "test_loss": 0.9008350587638138, "test_acc1": 77.372, "test_acc5": 94.084}
17
+ {"train_lr": 0.0018763066800438779, "train_loss": 0.9501215885197978, "epoch": 16, "test_loss": 0.8995034295465331, "test_acc1": 77.166, "test_acc5": 94.106}
18
+ {"train_lr": 0.0018607420270040137, "train_loss": 0.9509523625177143, "epoch": 17, "test_loss": 0.9015122564781047, "test_acc1": 77.132, "test_acc5": 94.088}
19
+ {"train_lr": 0.001844327925502041, "train_loss": 0.9506614573427881, "epoch": 18, "test_loss": 0.9019210995996699, "test_acc1": 77.044, "test_acc5": 94.12}
20
+ {"train_lr": 0.0018270805742745338, "train_loss": 0.9494276777999285, "epoch": 19, "test_loss": 0.90103893073471, "test_acc1": 77.25, "test_acc5": 94.088}
21
+ {"train_lr": 0.0018090169943749148, "train_loss": 0.9505323343785629, "epoch": 20, "test_loss": 0.9006480204746546, "test_acc1": 77.428, "test_acc5": 94.092}
22
+ {"train_lr": 0.001790155012375684, "train_loss": 0.9485720025715569, "epoch": 21, "test_loss": 0.8997843418356097, "test_acc1": 77.12, "test_acc5": 94.208}
23
+ {"train_lr": 0.00177051324277586, "train_loss": 0.948674776570896, "epoch": 22, "test_loss": 0.9026018450860782, "test_acc1": 77.192, "test_acc5": 94.122}
24
+ {"train_lr": 0.0017501110696303821, "train_loss": 0.9482977606454374, "epoch": 23, "test_loss": 0.8989825765495105, "test_acc1": 77.122, "test_acc5": 94.152}
25
+ {"train_lr": 0.001728968627421389, "train_loss": 0.9476831507918552, "epoch": 24, "test_loss": 0.8985824516743345, "test_acc1": 77.31, "test_acc5": 94.15}
26
+ {"train_lr": 0.0017071067811865767, "train_loss": 0.947474068536003, "epoch": 25, "test_loss": 0.9014654404976788, "test_acc1": 77.122, "test_acc5": 94.098}
27
+ {"train_lr": 0.0016845471059286062, "train_loss": 0.9458773597521254, "epoch": 26, "test_loss": 0.8992767619050067, "test_acc1": 77.268, "test_acc5": 94.146}
28
+ {"train_lr": 0.001661311865323677, "train_loss": 0.9460675816118265, "epoch": 27, "test_loss": 0.9003824421664333, "test_acc1": 77.312, "test_acc5": 94.132}
29
+ {"train_lr": 0.001637423989748733, "train_loss": 0.9438698154494994, "epoch": 28, "test_loss": 0.8985944117426568, "test_acc1": 77.376, "test_acc5": 94.12}
30
+ {"train_lr": 0.001612907053652909, "train_loss": 0.9444277047027457, "epoch": 29, "test_loss": 0.8961834871707974, "test_acc1": 77.382, "test_acc5": 94.132}
31
+ {"train_lr": 0.0015877852522924111, "train_loss": 0.9442095617014696, "epoch": 30, "test_loss": 0.8953145001931568, "test_acc1": 77.306, "test_acc5": 94.134}
32
+ {"train_lr": 0.0015620833778521046, "train_loss": 0.9420731575892441, "epoch": 31, "test_loss": 0.8949859906035615, "test_acc1": 77.372, "test_acc5": 94.138}
33
+ {"train_lr": 0.0015358267949790963, "train_loss": 0.9417429002722978, "epoch": 32, "test_loss": 0.8941260026696393, "test_acc1": 77.414, "test_acc5": 94.208}
34
+ {"train_lr": 0.0015090414157503675, "train_loss": 0.9393936146677279, "epoch": 33, "test_loss": 0.8951517046260102, "test_acc1": 77.498, "test_acc5": 94.188}
35
+ {"train_lr": 0.0014817536741017646, "train_loss": 0.9398717145817641, "epoch": 34, "test_loss": 0.8951449181570117, "test_acc1": 77.398, "test_acc5": 94.096}
36
+ {"train_lr": 0.001453990499739611, "train_loss": 0.9397707945059597, "epoch": 35, "test_loss": 0.8945940887684103, "test_acc1": 77.428, "test_acc5": 94.232}
37
+ {"train_lr": 0.0014257792915651636, "train_loss": 0.938914264136679, "epoch": 36, "test_loss": 0.8962938883877776, "test_acc1": 77.442, "test_acc5": 94.19}
38
+ {"train_lr": 0.001397147890634744, "train_loss": 0.9377800977937326, "epoch": 37, "test_loss": 0.8910840995171491, "test_acc1": 77.54, "test_acc5": 94.23}
39
+ {"train_lr": 0.001368124552684745, "train_loss": 0.9381735585436457, "epoch": 38, "test_loss": 0.8925753867306063, "test_acc1": 77.574, "test_acc5": 94.16}
40
+ {"train_lr": 0.0013387379202453142, "train_loss": 0.9369540920215419, "epoch": 39, "test_loss": 0.8923454177958886, "test_acc1": 77.496, "test_acc5": 94.28}
41
+ {"train_lr": 0.0013090169943749093, "train_loss": 0.9333221114668854, "epoch": 40, "test_loss": 0.8915809830055212, "test_acc1": 77.6, "test_acc5": 94.214}
42
+ {"train_lr": 0.0012789911060391633, "train_loss": 0.9338029348107276, "epoch": 41, "test_loss": 0.8893797928491212, "test_acc1": 77.69, "test_acc5": 94.288}
43
+ {"train_lr": 0.0012486898871647862, "train_loss": 0.9330607526810989, "epoch": 42, "test_loss": 0.8926802703258022, "test_acc1": 77.582, "test_acc5": 94.208}
44
+ {"train_lr": 0.001218143241396569, "train_loss": 0.9319615959168623, "epoch": 43, "test_loss": 0.8912819978564291, "test_acc1": 77.618, "test_acc5": 94.14}
45
+ {"train_lr": 0.0011873813145856604, "train_loss": 0.9313217092497417, "epoch": 44, "test_loss": 0.8883823378159262, "test_acc1": 77.658, "test_acc5": 94.192}
46
+ {"train_lr": 0.0011564344650402871, "train_loss": 0.9300515142664212, "epoch": 45, "test_loss": 0.8899350743312056, "test_acc1": 77.606, "test_acc5": 94.21}
47
+ {"train_lr": 0.0011253332335643327, "train_loss": 0.9290662591534998, "epoch": 46, "test_loss": 0.8883132905987523, "test_acc1": 77.494, "test_acc5": 94.272}
48
+ {"train_lr": 0.001094108313318475, "train_loss": 0.9279049030314243, "epoch": 47, "test_loss": 0.887962512919665, "test_acc1": 77.702, "test_acc5": 94.196}
49
+ {"train_lr": 0.0010627905195293463, "train_loss": 0.9270032352975879, "epoch": 48, "test_loss": 0.8868708503825585, "test_acc1": 77.718, "test_acc5": 94.302}
50
+ {"train_lr": 0.0010314107590780974, "train_loss": 0.9260229287305166, "epoch": 49, "test_loss": 0.8859207691515193, "test_acc1": 77.712, "test_acc5": 94.276}
51
+ {"train_lr": 0.0009999999999999343, "train_loss": 0.9257969355498654, "epoch": 50, "test_loss": 0.8849041308550274, "test_acc1": 77.782, "test_acc5": 94.24}
52
+ {"train_lr": 0.0009685892409218651, "train_loss": 0.9250000174991903, "epoch": 51, "test_loss": 0.884620481782862, "test_acc1": 77.722, "test_acc5": 94.198}
53
+ {"train_lr": 0.0009372094804707101, "train_loss": 0.9236977049054692, "epoch": 52, "test_loss": 0.8844312474398357, "test_acc1": 77.732, "test_acc5": 94.216}
54
+ {"train_lr": 0.0009058916866814987, "train_loss": 0.9236183154001933, "epoch": 53, "test_loss": 0.8849428826585755, "test_acc1": 77.694, "test_acc5": 94.272}
55
+ {"train_lr": 0.0008746667664356905, "train_loss": 0.9215438052374889, "epoch": 54, "test_loss": 0.886294969359932, "test_acc1": 77.49, "test_acc5": 94.248}
56
+ {"train_lr": 0.0008435655349597399, "train_loss": 0.9208157944395882, "epoch": 55, "test_loss": 0.8836620901627918, "test_acc1": 77.666, "test_acc5": 94.286}
57
+ {"train_lr": 0.0008126186854142688, "train_loss": 0.9194068921550579, "epoch": 56, "test_loss": 0.882629923579638, "test_acc1": 77.766, "test_acc5": 94.3}
58
+ {"train_lr": 0.0007818567586034925, "train_loss": 0.9191788917975191, "epoch": 57, "test_loss": 0.8819168749291574, "test_acc1": 77.992, "test_acc5": 94.278}
59
+ {"train_lr": 0.0007513101128351359, "train_loss": 0.9198855217449483, "epoch": 58, "test_loss": 0.88213624753763, "test_acc1": 77.852, "test_acc5": 94.3}
60
+ {"train_lr": 0.000721008893960812, "train_loss": 0.9176070873338701, "epoch": 59, "test_loss": 0.8837772236227075, "test_acc1": 77.798, "test_acc5": 94.354}
61
+ {"train_lr": 0.0006909830056250302, "train_loss": 0.9163718276347963, "epoch": 60, "test_loss": 0.8824031920841587, "test_acc1": 77.89, "test_acc5": 94.298}
62
+ {"train_lr": 0.0006612620797547435, "train_loss": 0.914866445025729, "epoch": 61, "test_loss": 0.8808865229339551, "test_acc1": 77.904, "test_acc5": 94.32}
63
+ {"train_lr": 0.0006318754473153419, "train_loss": 0.9150559181273817, "epoch": 62, "test_loss": 0.8808672300080205, "test_acc1": 77.956, "test_acc5": 94.306}
64
+ {"train_lr": 0.0006028521093652263, "train_loss": 0.9131123069681218, "epoch": 63, "test_loss": 0.8799271800024125, "test_acc1": 77.928, "test_acc5": 94.282}
65
+ {"train_lr": 0.000574220708434935, "train_loss": 0.9112918484856308, "epoch": 64, "test_loss": 0.8792256582957094, "test_acc1": 77.992, "test_acc5": 94.354}
66
+ {"train_lr": 0.0005460095002604524, "train_loss": 0.9100639034230805, "epoch": 65, "test_loss": 0.8801120497152933, "test_acc1": 77.99, "test_acc5": 94.296}
67
+ {"train_lr": 0.0005182463258982946, "train_loss": 0.9102253763558052, "epoch": 66, "test_loss": 0.8800176160643473, "test_acc1": 77.962, "test_acc5": 94.316}
68
+ {"train_lr": 0.0004909585842496341, "train_loss": 0.9088505878598033, "epoch": 67, "test_loss": 0.8804091747535769, "test_acc1": 77.986, "test_acc5": 94.304}
69
+ {"train_lr": 0.0004641732050210111, "train_loss": 0.9084323957217154, "epoch": 68, "test_loss": 0.8777954842885742, "test_acc1": 78.0, "test_acc5": 94.322}
70
+ {"train_lr": 0.0004379166221478616, "train_loss": 0.9075282472957862, "epoch": 69, "test_loss": 0.8784500328857271, "test_acc1": 78.066, "test_acc5": 94.38}
71
+ {"train_lr": 0.00041221474770750024, "train_loss": 0.9069060398056609, "epoch": 70, "test_loss": 0.8772927774187854, "test_acc1": 78.02, "test_acc5": 94.32}
72
+ {"train_lr": 0.0003870929463470055, "train_loss": 0.9070681458978332, "epoch": 71, "test_loss": 0.8766857854393132, "test_acc1": 78.132, "test_acc5": 94.306}
73
+ {"train_lr": 0.0003625760102513295, "train_loss": 0.9060561186877718, "epoch": 72, "test_loss": 0.8773289802281753, "test_acc1": 78.088, "test_acc5": 94.314}
74
+ {"train_lr": 0.0003386881346763327, "train_loss": 0.9050068777386446, "epoch": 73, "test_loss": 0.8769196353833694, "test_acc1": 78.088, "test_acc5": 94.328}
75
+ {"train_lr": 0.0003154528940713109, "train_loss": 0.9046978438366093, "epoch": 74, "test_loss": 0.8769187347587112, "test_acc1": 78.092, "test_acc5": 94.346}
76
+ {"train_lr": 0.00029289321881343744, "train_loss": 0.904974796434569, "epoch": 75, "test_loss": 0.8761430153685152, "test_acc1": 78.142, "test_acc5": 94.35}
77
+ {"train_lr": 0.0002710313725785874, "train_loss": 0.903332463122943, "epoch": 76, "test_loss": 0.8759037066451119, "test_acc1": 78.116, "test_acc5": 94.326}
78
+ {"train_lr": 0.0002498889303695469, "train_loss": 0.903731185572294, "epoch": 77, "test_loss": 0.8763512468246548, "test_acc1": 78.106, "test_acc5": 94.32}
79
+ {"train_lr": 0.0002294867572242191, "train_loss": 0.901658609685091, "epoch": 78, "test_loss": 0.8759333497613592, "test_acc1": 78.11, "test_acc5": 94.324}
80
+ {"train_lr": 0.0002098449876243195, "train_loss": 0.9004192501991166, "epoch": 79, "test_loss": 0.8755727065036364, "test_acc1": 78.192, "test_acc5": 94.354}
81
+ {"train_lr": 0.00019098300562504553, "train_loss": 0.900639298801726, "epoch": 80, "test_loss": 0.8752036135443642, "test_acc1": 78.158, "test_acc5": 94.336}
82
+ {"train_lr": 0.00017291942572544524, "train_loss": 0.8989108591926512, "epoch": 81, "test_loss": 0.8743628890008268, "test_acc1": 78.258, "test_acc5": 94.382}
83
+ {"train_lr": 0.0001556720744979767, "train_loss": 0.8978697478896229, "epoch": 82, "test_loss": 0.8749886486688843, "test_acc1": 78.242, "test_acc5": 94.352}
84
+ {"train_lr": 0.00013925797299606019, "train_loss": 0.8975689940651654, "epoch": 83, "test_loss": 0.8747964766248107, "test_acc1": 78.232, "test_acc5": 94.352}
85
+ {"train_lr": 0.00012369331995613583, "train_loss": 0.8979594122694342, "epoch": 84, "test_loss": 0.874699472733166, "test_acc1": 78.2, "test_acc5": 94.35}
86
+ {"train_lr": 0.00010899347581163435, "train_loss": 0.8969663048875223, "epoch": 85, "test_loss": 0.8747386357287312, "test_acc1": 78.16, "test_acc5": 94.308}
87
+ {"train_lr": 9.5172947533978e-05, "train_loss": 0.8967000352493344, "epoch": 86, "test_loss": 0.874495963192047, "test_acc1": 78.152, "test_acc5": 94.346}
88
+ {"train_lr": 8.224537431602316e-05, "train_loss": 0.8980387321684868, "epoch": 87, "test_loss": 0.8739630047546323, "test_acc1": 78.2, "test_acc5": 94.388}
89
+ {"train_lr": 7.022351411175157e-05, "train_loss": 0.8949271040055878, "epoch": 88, "test_loss": 0.8741501825087515, "test_acc1": 78.226, "test_acc5": 94.366}
90
+ {"train_lr": 5.911923104577377e-05, "train_loss": 0.8943974479372102, "epoch": 89, "test_loss": 0.8739263171430134, "test_acc1": 78.242, "test_acc5": 94.358}
91
+ {"train_lr": 4.8943483704848814e-05, "train_loss": 0.8957436852904258, "epoch": 90, "test_loss": 0.8737455527953175, "test_acc1": 78.226, "test_acc5": 94.354}
92
+ {"train_lr": 3.9706314323055196e-05, "train_loss": 0.8937930382142246, "epoch": 91, "test_loss": 0.8737212545655267, "test_acc1": 78.252, "test_acc5": 94.342}
93
+ {"train_lr": 3.141683887136792e-05, "train_loss": 0.8953395644861415, "epoch": 92, "test_loss": 0.8737035993572391, "test_acc1": 78.252, "test_acc5": 94.352}
94
+ {"train_lr": 2.4083238061252423e-05, "train_loss": 0.8945637361536825, "epoch": 93, "test_loss": 0.8737105267203372, "test_acc1": 78.246, "test_acc5": 94.346}
95
+ {"train_lr": 1.7712749271312274e-05, "train_loss": 0.8935419751634085, "epoch": 94, "test_loss": 0.8736384067389057, "test_acc1": 78.238, "test_acc5": 94.356}
96
+ {"train_lr": 1.2311659404861753e-05, "train_loss": 0.8946735740773591, "epoch": 95, "test_loss": 0.8735849036813697, "test_acc1": 78.24, "test_acc5": 94.34}
97
+ {"train_lr": 7.885298685522277e-06, "train_loss": 0.8929852355796959, "epoch": 96, "test_loss": 0.8736040683658531, "test_acc1": 78.252, "test_acc5": 94.34}
98
+ {"train_lr": 4.4380353969200165e-06, "train_loss": 0.8954210997913725, "epoch": 97, "test_loss": 0.8736254497790885, "test_acc1": 78.268, "test_acc5": 94.342}
99
+ {"train_lr": 1.9732715717283947e-06, "train_loss": 0.892153094175502, "epoch": 98, "test_loss": 0.8736329334395011, "test_acc1": 78.254, "test_acc5": 94.344}
100
+ {"train_lr": 4.934396342684219e-07, "train_loss": 0.8933977404869036, "epoch": 99, "test_loss": 0.8736348381966276, "test_acc1": 78.256, "test_acc5": 94.344}
Vim/Small/checkpoint.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:932e4fa14806c489242d5771060010e58e5636436edfbc276e93ca07f105849b
3
+ size 1007834704
Vim/Small/checkpoint.pth.tar ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68604ebe0327627c9a1521b6648ffa05257c71835134070eaa858af09e8398f4
3
+ size 16394696
Vim/Small/config.txt ADDED
@@ -0,0 +1,36 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ arch: vim_small_patch16_224
2
+ batch_size_per_gpu: 64
3
+ clip_grad: 3.0
4
+ dist_url:
5
+ drop_path_rate: 0.1
6
+ epochs: 400
7
+ freeze_last_layer: 1
8
+ global_crops_scale: (0.25, 1.0)
9
+ gpu: 0
10
+ local_crops_number: 10
11
+ local_crops_scale: (0.05, 0.25)
12
+ local_rank: 0
13
+ lr: 0.0005
14
+ min_lr: 1e-06
15
+ momentum_teacher: 0.996
16
+ ngpus: 8
17
+ nodes: 2
18
+ norm_last_layer: True
19
+ num_workers: 10
20
+ optimizer: adamw
21
+ out_dim: 65536
22
+ partition: main
23
+ patch_size: 16
24
+ rank: 0
25
+ saveckp_freq: 5
26
+ seed: 0
27
+ teacher_temp: 0.07
28
+ use_bn_in_head: False
29
+ use_fp16: True (bf16)
30
+ use_volta32: False
31
+ warmup_epochs: 10
32
+ warmup_teacher_temp: 0.04
33
+ warmup_teacher_temp_epochs: 30
34
+ weight_decay: 0.04
35
+ weight_decay_end: 0.4
36
+ world_size: 16
Vim/Small/log.txt ADDED
@@ -0,0 +1,400 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"train_loss": 9.891199271795418, "train_lr": 0.00011240893965284647, "train_wd": 0.04000184804963205, "epoch": 0}
2
+ {"train_loss": 9.5973723379435, "train_lr": 0.00033742917528554735, "train_wd": 0.040012946191043855, "epoch": 1}
3
+ {"train_loss": 9.073680406583728, "train_lr": 0.000562449410918248, "train_wd": 0.04003514678174925, "epoch": 2}
4
+ {"train_loss": 7.7527198973212315, "train_lr": 0.0007874696465509491, "train_wd": 0.04006844845231126, "epoch": 3}
5
+ {"train_loss": 6.858771469077761, "train_lr": 0.0010124898821836498, "train_wd": 0.04011284914852605, "epoch": 4}
6
+ {"train_loss": 6.228180805413271, "train_lr": 0.0012375101178163503, "train_wd": 0.04016834613154946, "epoch": 5}
7
+ {"train_loss": 5.828166456924354, "train_lr": 0.0014625303534490516, "train_wd": 0.040234935978066266, "epoch": 6}
8
+ {"train_loss": 5.552261811384051, "train_lr": 0.0016875505890817516, "train_wd": 0.04031261458050099, "epoch": 7}
9
+ {"train_loss": 5.350189290958629, "train_lr": 0.0019125708247144542, "train_wd": 0.04040137714727146, "epoch": 8}
10
+ {"train_loss": 5.206569257417886, "train_lr": 0.0021375910603471525, "train_wd": 0.040501218203084596, "epoch": 9}
11
+ {"train_loss": 5.0857582401922, "train_lr": 0.00224998785517435, "train_wd": 0.040612131589273674, "epoch": 10}
12
+ {"train_loss": 4.988846141049902, "train_lr": 0.002249914921577872, "train_wd": 0.04073411046417868, "epoch": 11}
13
+ {"train_loss": 4.911772376520457, "train_lr": 0.002249769026308481, "train_wd": 0.04086714730356794, "epoch": 12}
14
+ {"train_loss": 4.851678893041553, "train_lr": 0.0022495501788331153, "train_wd": 0.041011233901102694, "epoch": 13}
15
+ {"train_loss": 4.804512802984932, "train_lr": 0.0022492583933524735, "train_wd": 0.041166361368842726, "epoch": 14}
16
+ {"train_loss": 4.768699391917002, "train_lr": 0.0022488936888000887, "train_wd": 0.04133252013779519, "epoch": 15}
17
+ {"train_loss": 4.742429010784455, "train_lr": 0.0022484560888411287, "train_wd": 0.041509699958504516, "epoch": 16}
18
+ {"train_loss": 4.725466685892224, "train_lr": 0.0022479456218708234, "train_wd": 0.04169788990168485, "epoch": 17}
19
+ {"train_loss": 4.7139874233080326, "train_lr": 0.002247362321012642, "train_wd": 0.041897078358893815, "epoch": 18}
20
+ {"train_loss": 4.707533731082861, "train_lr": 0.0022467062241161326, "train_wd": 0.0421072530432495, "epoch": 19}
21
+ {"train_loss": 4.706119315774678, "train_lr": 0.002245977373754498, "train_wd": 0.042328400990186865, "epoch": 20}
22
+ {"train_loss": 4.708116093118914, "train_lr": 0.002245175817221788, "train_wd": 0.042560508558259325, "epoch": 21}
23
+ {"train_loss": 4.712001237714533, "train_lr": 0.002244301606529856, "train_wd": 0.042803561429978494, "epoch": 22}
24
+ {"train_loss": 4.723223430218456, "train_lr": 0.0022433547984049827, "train_wd": 0.043057544612698416, "epoch": 23}
25
+ {"train_loss": 4.741455932297438, "train_lr": 0.002242335454284184, "train_wd": 0.04332244243953986, "epoch": 24}
26
+ {"train_loss": 4.756836122201143, "train_lr": 0.0022412436403112497, "train_wd": 0.04359823857035742, "epoch": 25}
27
+ {"train_loss": 4.781607317615399, "train_lr": 0.002240079427332412, "train_wd": 0.04388491599274647, "epoch": 26}
28
+ {"train_loss": 4.813056948927524, "train_lr": 0.002238842890891801, "train_wd": 0.04418245702309301, "epoch": 27}
29
+ {"train_loss": 4.847504815788006, "train_lr": 0.002237534111226471, "train_wd": 0.044490843307665055, "epoch": 28}
30
+ {"train_loss": 4.8941699212832415, "train_lr": 0.0022361531732612732, "train_wd": 0.04481005582374382, "epoch": 29}
31
+ {"train_loss": 4.897879076313129, "train_lr": 0.0022347001666032946, "train_wd": 0.04514007488079763, "epoch": 30}
32
+ {"train_loss": 4.902579244958768, "train_lr": 0.0022331751855360475, "train_wd": 0.04548088012169672, "epoch": 31}
33
+ {"train_loss": 4.90696275837237, "train_lr": 0.002231578329013376, "train_wd": 0.045832450523968234, "epoch": 32}
34
+ {"train_loss": 4.939746108790525, "train_lr": 0.0022299097006530056, "train_wd": 0.046194764401093935, "epoch": 33}
35
+ {"train_loss": 4.926793028410676, "train_lr": 0.0022281694087298316, "train_wd": 0.04656779940384704, "epoch": 34}
36
+ {"train_loss": 4.932746611767821, "train_lr": 0.0022263575661689216, "train_wd": 0.046951532521671516, "epoch": 35}
37
+ {"train_loss": 4.967408751823204, "train_lr": 0.002224474290538131, "train_wd": 0.04734594008410122, "epoch": 36}
38
+ {"train_loss": 5.014066947557086, "train_lr": 0.002222519704040518, "train_wd": 0.04775099776221966, "epoch": 37}
39
+ {"train_loss": 5.053495651097607, "train_lr": 0.0022204939335063963, "train_wd": 0.048166680570161456, "epoch": 38}
40
+ {"train_loss": 5.077481628563121, "train_lr": 0.0022183971103851238, "train_wd": 0.048592962866652885, "epoch": 39}
41
+ {"train_loss": 5.090614873719373, "train_lr": 0.0022162293707365375, "train_wd": 0.04902981835659392, "epoch": 40}
42
+ {"train_loss": 5.099656534387911, "train_lr": 0.0022139908552221608, "train_wd": 0.049477220092680206, "epoch": 41}
43
+ {"train_loss": 5.102793878288292, "train_lr": 0.0022116817090960536, "train_wd": 0.049935140477065126, "epoch": 42}
44
+ {"train_loss": 5.103122014811428, "train_lr": 0.0022093020821954096, "train_wd": 0.050403551263062424, "epoch": 43}
45
+ {"train_loss": 5.105584094421469, "train_lr": 0.00220685212893079, "train_wd": 0.0508824235568884, "epoch": 44}
46
+ {"train_loss": 5.101845648336253, "train_lr": 0.0022043320082761756, "train_wd": 0.05137172781944444, "epoch": 45}
47
+ {"train_loss": 5.100284054250025, "train_lr": 0.0022017418837585634, "train_wd": 0.051871433868138445, "epoch": 46}
48
+ {"train_loss": 5.089728962665768, "train_lr": 0.0021990819234474286, "train_wd": 0.05238151087874799, "epoch": 47}
49
+ {"train_loss": 5.0817803965805535, "train_lr": 0.002196352299943785, "train_wd": 0.052901927387319865, "epoch": 48}
50
+ {"train_loss": 5.086416789015635, "train_lr": 0.0021935531903689853, "train_wd": 0.053432651292112866, "epoch": 49}
51
+ {"train_loss": 5.094888877525604, "train_lr": 0.002190684776353248, "train_wd": 0.05397364985557633, "epoch": 50}
52
+ {"train_loss": 5.1006680333035455, "train_lr": 0.002187747244023839, "train_wd": 0.05452488970637067, "epoch": 51}
53
+ {"train_loss": 5.1057985527195235, "train_lr": 0.002184740783993028, "train_wd": 0.05508633684142527, "epoch": 52}
54
+ {"train_loss": 5.11928050439778, "train_lr": 0.0021816655913456913, "train_wd": 0.05565795662803626, "epoch": 53}
55
+ {"train_loss": 5.129029909126478, "train_lr": 0.0021785218656266737, "train_wd": 0.05623971380600251, "epoch": 54}
56
+ {"train_loss": 5.131504016367795, "train_lr": 0.002175309810827842, "train_wd": 0.056831572489801044, "epoch": 55}
57
+ {"train_loss": 5.133396216916094, "train_lr": 0.002172029635374821, "train_wd": 0.05743349617080036, "epoch": 56}
58
+ {"train_loss": 5.13463795277998, "train_lr": 0.0021686815521134934, "train_wd": 0.05804544771951252, "epoch": 57}
59
+ {"train_loss": 5.130762478734235, "train_lr": 0.0021652657782961888, "train_wd": 0.058667389387883184, "epoch": 58}
60
+ {"train_loss": 5.124997974085293, "train_lr": 0.0021617825355675704, "train_wd": 0.059299282811621036, "epoch": 59}
61
+ {"train_loss": 5.154246819837631, "train_lr": 0.0021582320499502717, "train_wd": 0.05994108901256308, "epoch": 60}
62
+ {"train_loss": 5.112774317481106, "train_lr": 0.0021546145518302117, "train_wd": 0.060592768401079425, "epoch": 61}
63
+ {"train_loss": 5.11256169676066, "train_lr": 0.002150930275941669, "train_wd": 0.06125428077851599, "epoch": 62}
64
+ {"train_loss": 5.111878907187379, "train_lr": 0.002147179461352007, "train_wd": 0.06192558533967335, "epoch": 63}
65
+ {"train_loss": 5.113865970421752, "train_lr": 0.002143362351446228, "train_wd": 0.06260664067532365, "epoch": 64}
66
+ {"train_loss": 5.114117870084959, "train_lr": 0.0021394791939111186, "train_wd": 0.06329740477476624, "epoch": 65}
67
+ {"train_loss": 5.113238768147336, "train_lr": 0.0021355302407192033, "train_wd": 0.06399783502841726, "epoch": 66}
68
+ {"train_loss": 5.111505580963277, "train_lr": 0.002131515748112402, "train_wd": 0.0647078882304398, "epoch": 67}
69
+ {"train_loss": 5.107590312544676, "train_lr": 0.0021274359765853772, "train_wd": 0.06542752058140736, "epoch": 68}
70
+ {"train_loss": 5.10867228032016, "train_lr": 0.002123291190868668, "train_wd": 0.06615668769100679, "epoch": 69}
71
+ {"train_loss": 5.109139443640943, "train_lr": 0.0021190816599114598, "train_wd": 0.0668953445807762, "epoch": 70}
72
+ {"train_loss": 5.111809980829985, "train_lr": 0.0021148076568642113, "train_wd": 0.06764344568687908, "epoch": 71}
73
+ {"train_loss": 5.112491459922968, "train_lr": 0.002110469459060837, "train_wd": 0.06840094486291547, "epoch": 72}
74
+ {"train_loss": 5.10588596155532, "train_lr": 0.0021060673480007845, "train_wd": 0.06916779538276807, "epoch": 73}
75
+ {"train_loss": 5.109031590733597, "train_lr": 0.0021016016093307224, "train_wd": 0.06994394994348456, "epoch": 74}
76
+ {"train_loss": 5.107657144717176, "train_lr": 0.00209707253282604, "train_wd": 0.0707293606681956, "epoch": 75}
77
+ {"train_loss": 5.108343432614986, "train_lr": 0.002092480412372023, "train_wd": 0.07152397910906821, "epoch": 76}
78
+ {"train_loss": 5.109115054674572, "train_lr": 0.0020878255459447852, "train_wd": 0.07232775625029378, "epoch": 77}
79
+ {"train_loss": 5.108969321836241, "train_lr": 0.0020831082355919333, "train_wd": 0.07314064251111234, "epoch": 78}
80
+ {"train_loss": 5.110082272216856, "train_lr": 0.0020783287874129846, "train_wd": 0.07396258774886999, "epoch": 79}
81
+ {"train_loss": 5.110463185651268, "train_lr": 0.0020734875115394733, "train_wd": 0.07479354126211303, "epoch": 80}
82
+ {"train_loss": 5.110531678374151, "train_lr": 0.0020685847221148567, "train_wd": 0.07563345179371445, "epoch": 81}
83
+ {"train_loss": 5.112849600541649, "train_lr": 0.0020636207372741176, "train_wd": 0.07648226753403647, "epoch": 82}
84
+ {"train_loss": 5.113088597711042, "train_lr": 0.0020585958791231136, "train_wd": 0.07733993612412579, "epoch": 83}
85
+ {"train_loss": 5.113309768928612, "train_lr": 0.0020535104737176967, "train_wd": 0.07820640465894399, "epoch": 84}
86
+ {"train_loss": 5.1751034421850735, "train_lr": 0.0020483648510425246, "train_wd": 0.07908161969063034, "epoch": 85}
87
+ {"train_loss": 5.120830223482432, "train_lr": 0.0020431593449896897, "train_wd": 0.07996552723179881, "epoch": 86}
88
+ {"train_loss": 5.120273708385958, "train_lr": 0.002037894293337015, "train_wd": 0.08085807275886897, "epoch": 87}
89
+ {"train_loss": 5.14396550175812, "train_lr": 0.002032570037726157, "train_wd": 0.08175920121542826, "epoch": 88}
90
+ {"train_loss": 5.124640809010259, "train_lr": 0.002027186923640429, "train_wd": 0.08266885701562902, "epoch": 89}
91
+ {"train_loss": 5.125454128842702, "train_lr": 0.002021745300382401, "train_wd": 0.0835869840476164, "epoch": 90}
92
+ {"train_loss": 5.128255861751039, "train_lr": 0.002016245521051194, "train_wd": 0.08451352567699047, "epoch": 91}
93
+ {"train_loss": 5.127965825656764, "train_lr": 0.00201068794251962, "train_wd": 0.08544842475029914, "epoch": 92}
94
+ {"train_loss": 5.130129556307833, "train_lr": 0.002005072925410979, "train_wd": 0.0863916235985636, "epoch": 93}
95
+ {"train_loss": 5.135595977485037, "train_lr": 0.001999400834075681, "train_wd": 0.08734306404083615, "epoch": 94}
96
+ {"train_loss": 5.132060706454644, "train_lr": 0.001993672036567612, "train_wd": 0.08830268738778872, "epoch": 95}
97
+ {"train_loss": 5.135390626655208, "train_lr": 0.0019878869046202254, "train_wd": 0.08927043444533281, "epoch": 96}
98
+ {"train_loss": 5.137153720416182, "train_lr": 0.001982045813622449, "train_wd": 0.09024624551827173, "epoch": 97}
99
+ {"train_loss": 5.14193490835474, "train_lr": 0.0019761491425943018, "train_wd": 0.09123006041398163, "epoch": 98}
100
+ {"train_loss": 5.139173849809656, "train_lr": 0.0019701972741623243, "train_wd": 0.09222181844612586, "epoch": 99}
101
+ {"train_loss": 5.140231019104842, "train_lr": 0.001964190594534725, "train_wd": 0.09322145843839738, "epoch": 100}
102
+ {"train_loss": 5.14518040917117, "train_lr": 0.0019581294934763317, "train_wd": 0.09422891872829245, "epoch": 101}
103
+ {"train_loss": 5.147588141744943, "train_lr": 0.0019520143642833164, "train_wd": 0.09524413717091516, "epoch": 102}
104
+ {"train_loss": 5.151189850960418, "train_lr": 0.001945845603757641, "train_wd": 0.09626705114280987, "epoch": 103}
105
+ {"train_loss": 5.153369373197464, "train_lr": 0.0019396236121813385, "train_wd": 0.0972975975458242, "epoch": 104}
106
+ {"train_loss": 5.153484287271969, "train_lr": 0.0019333487932905236, "train_wd": 0.09833571281100173, "epoch": 105}
107
+ {"train_loss": 5.155888468295121, "train_lr": 0.0019270215542492117, "train_wd": 0.09938133290250328, "epoch": 106}
108
+ {"train_loss": 5.157620319198791, "train_lr": 0.0019206423056228657, "train_wd": 0.10043439332155589, "epoch": 107}
109
+ {"train_loss": 5.158929239878122, "train_lr": 0.0019142114613517878, "train_wd": 0.10149482911043275, "epoch": 108}
110
+ {"train_loss": 5.171671258316909, "train_lr": 0.001907729438724256, "train_wd": 0.10256257485645953, "epoch": 109}
111
+ {"train_loss": 5.161017376366708, "train_lr": 0.0019011966583494214, "train_wd": 0.1036375646960484, "epoch": 110}
112
+ {"train_loss": 5.165433323926491, "train_lr": 0.0018946135441300423, "train_wd": 0.10471973231876283, "epoch": 111}
113
+ {"train_loss": 5.17118961135332, "train_lr": 0.001887980523234967, "train_wd": 0.10580901097140671, "epoch": 112}
114
+ {"train_loss": 5.174196094578262, "train_lr": 0.0018812980260714182, "train_wd": 0.10690533346214137, "epoch": 113}
115
+ {"train_loss": 5.170867326019479, "train_lr": 0.0018745664862570574, "train_wd": 0.10800863216463152, "epoch": 114}
116
+ {"train_loss": 5.174493308083044, "train_lr": 0.0018677863405918607, "train_wd": 0.10911883902221604, "epoch": 115}
117
+ {"train_loss": 5.176568635540614, "train_lr": 0.001860958029029756, "train_wd": 0.11023588555210692, "epoch": 116}
118
+ {"train_loss": 5.178822325323697, "train_lr": 0.001854081994650105, "train_wd": 0.1113597028496118, "epoch": 117}
119
+ {"train_loss": 5.1818589812560045, "train_lr": 0.001847158683628916, "train_wd": 0.11249022159238631, "epoch": 118}
120
+ {"train_loss": 5.1838316946900145, "train_lr": 0.0018401885452099223, "train_wd": 0.1136273720447094, "epoch": 119}
121
+ {"train_loss": 5.1840418551108245, "train_lr": 0.0018331720316754193, "train_wd": 0.11477108406178468, "epoch": 120}
122
+ {"train_loss": 5.186170782188146, "train_lr": 0.0018261095983169158, "train_wd": 0.11592128709406752, "epoch": 121}
123
+ {"train_loss": 5.213695119896667, "train_lr": 0.0018190017034055916, "train_wd": 0.11707791019161676, "epoch": 122}
124
+ {"train_loss": 5.187233262335797, "train_lr": 0.0018118488081625569, "train_wd": 0.11824088200847166, "epoch": 123}
125
+ {"train_loss": 5.192278328219906, "train_lr": 0.0018046513767289386, "train_wd": 0.11941013080705261, "epoch": 124}
126
+ {"train_loss": 5.196099772084531, "train_lr": 0.0017974098761357451, "train_wd": 0.12058558446258585, "epoch": 125}
127
+ {"train_loss": 5.196388436039146, "train_lr": 0.0017901247762735744, "train_wd": 0.12176717046755348, "epoch": 126}
128
+ {"train_loss": 5.197198032636008, "train_lr": 0.001782796549862115, "train_wd": 0.1229548159361643, "epoch": 127}
129
+ {"train_loss": 5.199195358714611, "train_lr": 0.0017754256724194784, "train_wd": 0.12414844760885205, "epoch": 128}
130
+ {"train_loss": 5.200391364469231, "train_lr": 0.0017680126222313363, "train_wd": 0.12534799185679213, "epoch": 129}
131
+ {"train_loss": 5.204034713496693, "train_lr": 0.001760557880319897, "train_wd": 0.1265533746864453, "epoch": 130}
132
+ {"train_loss": 5.205680902127168, "train_lr": 0.0017530619304126761, "train_wd": 0.127764521744121, "epoch": 131}
133
+ {"train_loss": 5.20715323240637, "train_lr": 0.0017455252589111201, "train_wd": 0.12898135832056315, "epoch": 132}
134
+ {"train_loss": 5.210350695917074, "train_lr": 0.0017379483548590475, "train_wd": 0.13020380935556003, "epoch": 133}
135
+ {"train_loss": 5.211882775475224, "train_lr": 0.0017303317099108988, "train_wd": 0.1314317994425741, "epoch": 134}
136
+ {"train_loss": 5.22293084859848, "train_lr": 0.0017226758182998507, "train_wd": 0.13266525283339178, "epoch": 135}
137
+ {"train_loss": 5.210758210139738, "train_lr": 0.001714981176805742, "train_wd": 0.1339040934427984, "epoch": 136}
138
+ {"train_loss": 5.214704577371085, "train_lr": 0.0017072482847228284, "train_wd": 0.135148244853269, "epoch": 137}
139
+ {"train_loss": 5.218287415784611, "train_lr": 0.0016994776438273955, "train_wd": 0.1363976303196845, "epoch": 138}
140
+ {"train_loss": 5.220372045318857, "train_lr": 0.0016916697583451972, "train_wd": 0.13765217277406447, "epoch": 139}
141
+ {"train_loss": 5.218799246229428, "train_lr": 0.001683825134918733, "train_wd": 0.1389117948303205, "epoch": 140}
142
+ {"train_loss": 5.220070712536359, "train_lr": 0.0016759442825743753, "train_wd": 0.14017641878903087, "epoch": 141}
143
+ {"train_loss": 5.22048305904122, "train_lr": 0.0016680277126893414, "train_wd": 0.14144596664223327, "epoch": 142}
144
+ {"train_loss": 5.22231460121467, "train_lr": 0.0016600759389584988, "train_wd": 0.14272036007823552, "epoch": 143}
145
+ {"train_loss": 5.2232158905525, "train_lr": 0.001652089477361057, "train_wd": 0.14399952048644757, "epoch": 144}
146
+ {"train_loss": 5.2248708029731, "train_lr": 0.001644068846127063, "train_wd": 0.1452833689622306, "epoch": 145}
147
+ {"train_loss": 5.2260129793728, "train_lr": 0.001636014565703778, "train_wd": 0.14657182631176244, "epoch": 146}
148
+ {"train_loss": 5.228380132993634, "train_lr": 0.001627927158721923, "train_wd": 0.14786481305692498, "epoch": 147}
149
+ {"train_loss": 5.226925445867957, "train_lr": 0.0016198071499617427, "train_wd": 0.1491622494402055, "epoch": 148}
150
+ {"train_loss": 5.230628825223846, "train_lr": 0.0016116550663189746, "train_wd": 0.15046405542961588, "epoch": 149}
151
+ {"train_loss": 5.230576059801115, "train_lr": 0.0016034714367706368, "train_wd": 0.1517701507236311, "epoch": 150}
152
+ {"train_loss": 5.232340854635056, "train_lr": 0.0015952567923407282, "train_wd": 0.1530804547561409, "epoch": 151}
153
+ {"train_loss": 5.2346243103631105, "train_lr": 0.0015870116660657537, "train_wd": 0.1543948867014205, "epoch": 152}
154
+ {"train_loss": 5.2348252197892835, "train_lr": 0.0015787365929601374, "train_wd": 0.155713365479116, "epoch": 153}
155
+ {"train_loss": 5.236613237243191, "train_lr": 0.001570432109981519, "train_wd": 0.15703580975924591, "epoch": 154}
156
+ {"train_loss": 5.235389357758797, "train_lr": 0.0015620987559958961, "train_wd": 0.15836213796721774, "epoch": 155}
157
+ {"train_loss": 5.2366490202020115, "train_lr": 0.001553737071742669, "train_wd": 0.15969226828885974, "epoch": 156}
158
+ {"train_loss": 5.237074780771486, "train_lr": 0.0015453475997995406, "train_wd": 0.16102611867546912, "epoch": 157}
159
+ {"train_loss": 5.239736160821766, "train_lr": 0.00153693088454733, "train_wd": 0.1623636068488698, "epoch": 158}
160
+ {"train_loss": 5.248110405582604, "train_lr": 0.0015284874721346218, "train_wd": 0.16370465030649164, "epoch": 159}
161
+ {"train_loss": 5.238684097711417, "train_lr": 0.0015200179104423513, "train_wd": 0.16504916632645733, "epoch": 160}
162
+ {"train_loss": 5.241968135771563, "train_lr": 0.0015115227490482379, "train_wd": 0.16639707197268594, "epoch": 161}
163
+ {"train_loss": 5.242491885483694, "train_lr": 0.0015030025391911306, "train_wd": 0.16774828410000767, "epoch": 162}
164
+ {"train_loss": 5.265134109367284, "train_lr": 0.0014944578337352358, "train_wd": 0.1691027193592933, "epoch": 163}
165
+ {"train_loss": 5.243678727703129, "train_lr": 0.001485889187134251, "train_wd": 0.17046029420259676, "epoch": 164}
166
+ {"train_loss": 5.245903512753314, "train_lr": 0.0014772971553953706, "train_wd": 0.17182092488830647, "epoch": 165}
167
+ {"train_loss": 5.247507754007547, "train_lr": 0.0014686822960432177, "train_wd": 0.17318452748631258, "epoch": 166}
168
+ {"train_loss": 5.249220731125461, "train_lr": 0.001460045168083676, "train_wd": 0.17455101788318408, "epoch": 167}
169
+ {"train_loss": 5.248228075031897, "train_lr": 0.0014513863319676017, "train_wd": 0.17592031178735662, "epoch": 168}
170
+ {"train_loss": 5.24664253727209, "train_lr": 0.0014427063495544542, "train_wd": 0.17729232473433176, "epoch": 169}
171
+ {"train_loss": 5.246017999482526, "train_lr": 0.00143400578407586, "train_wd": 0.17866697209188823, "epoch": 170}
172
+ {"train_loss": 5.246341891425977, "train_lr": 0.0014252852000990466, "train_wd": 0.18004416906530218, "epoch": 171}
173
+ {"train_loss": 5.248802040835365, "train_lr": 0.0014165451634902053, "train_wd": 0.181423830702577, "epoch": 172}
174
+ {"train_loss": 5.248038672178769, "train_lr": 0.0014077862413777898, "train_wd": 0.18280587189968386, "epoch": 173}
175
+ {"train_loss": 5.248076795066575, "train_lr": 0.0013990090021157005, "train_wd": 0.1841902074058122, "epoch": 174}
176
+ {"train_loss": 5.2474407876173945, "train_lr": 0.0013902140152464205, "train_wd": 0.18557675182862676, "epoch": 175}
177
+ {"train_loss": 5.248629381366485, "train_lr": 0.00138140185146404, "train_wd": 0.18696541963953647, "epoch": 176}
178
+ {"train_loss": 5.249356719051048, "train_lr": 0.0013725730825772415, "train_wd": 0.1883561251789694, "epoch": 177}
179
+ {"train_loss": 5.249669514560728, "train_lr": 0.0013637282814721854, "train_wd": 0.18974878266165804, "epoch": 178}
180
+ {"train_loss": 5.249930986058083, "train_lr": 0.0013548680220753357, "train_wd": 0.1911433061819274, "epoch": 179}
181
+ {"train_loss": 5.24908554668335, "train_lr": 0.0013459928793162314, "train_wd": 0.19253960971899864, "epoch": 180}
182
+ {"train_loss": 5.249612451921836, "train_lr": 0.0013371034290901656, "train_wd": 0.19393760714229263, "epoch": 181}
183
+ {"train_loss": 5.268937307581913, "train_lr": 0.0013282002482208257, "train_wd": 0.19533721221674286, "epoch": 182}
184
+ {"train_loss": 5.246443628568015, "train_lr": 0.0013192839144228591, "train_wd": 0.19673833860811532, "epoch": 183}
185
+ {"train_loss": 5.249958403890939, "train_lr": 0.001310355006264392, "train_wd": 0.19814089988833497, "epoch": 184}
186
+ {"train_loss": 5.24962667431191, "train_lr": 0.0013014141031294723, "train_wd": 0.19954480954081513, "epoch": 185}
187
+ {"train_loss": 5.2482702482840144, "train_lr": 0.0012924617851804985, "train_wd": 0.20094998096579542, "epoch": 186}
188
+ {"train_loss": 5.25966331832629, "train_lr": 0.0012834986333205485, "train_wd": 0.20235632748568294, "epoch": 187}
189
+ {"train_loss": 5.250594736467734, "train_lr": 0.0012745252291557032, "train_wd": 0.2037637623504005, "epoch": 188}
190
+ {"train_loss": 5.246219114880625, "train_lr": 0.0012655421549572995, "train_wd": 0.20517219874273612, "epoch": 189}
191
+ {"train_loss": 5.246738840636017, "train_lr": 0.0012565499936241522, "train_wd": 0.2065815497836978, "epoch": 190}
192
+ {"train_loss": 5.248329286363056, "train_lr": 0.001247549328644715, "train_wd": 0.2079917285378759, "epoch": 191}
193
+ {"train_loss": 5.246703330329139, "train_lr": 0.0012385407440592489, "train_wd": 0.20940264801880148, "epoch": 192}
194
+ {"train_loss": 5.246316834033536, "train_lr": 0.001229524824421893, "train_wd": 0.21081422119431556, "epoch": 193}
195
+ {"train_loss": 5.247743306078499, "train_lr": 0.0012205021547627524, "train_wd": 0.21222636099193462, "epoch": 194}
196
+ {"train_loss": 5.245447532343064, "train_lr": 0.001211473320549938, "train_wd": 0.2136389803042259, "epoch": 195}
197
+ {"train_loss": 5.243874298690034, "train_lr": 0.0012024389076515523, "train_wd": 0.215051991994174, "epoch": 196}
198
+ {"train_loss": 5.242583936888823, "train_lr": 0.0011933995022977094, "train_wd": 0.21646530890056367, "epoch": 197}
199
+ {"train_loss": 5.241789544318363, "train_lr": 0.0011843556910424652, "train_wd": 0.21787884384335007, "epoch": 198}
200
+ {"train_loss": 5.24216862735774, "train_lr": 0.001175308060725774, "train_wd": 0.2192925096290399, "epoch": 199}
201
+ {"train_loss": 5.240163515047204, "train_lr": 0.0011662571984354, "train_wd": 0.22070621905606813, "epoch": 200}
202
+ {"train_loss": 5.239865322907765, "train_lr": 0.001157203691468823, "train_wd": 0.22211988492017867, "epoch": 201}
203
+ {"train_loss": 5.246181382656955, "train_lr": 0.0011481481272951433, "train_wd": 0.22353342001980173, "epoch": 202}
204
+ {"train_loss": 5.238502755796881, "train_lr": 0.0011390910935169393, "train_wd": 0.22494673716143385, "epoch": 203}
205
+ {"train_loss": 5.239301754755797, "train_lr": 0.0011300331778321534, "train_wd": 0.22635974916501672, "epoch": 204}
206
+ {"train_loss": 5.23753531768525, "train_lr": 0.001120974967995955, "train_wd": 0.22777236886931443, "epoch": 205}
207
+ {"train_loss": 5.2392446062297555, "train_lr": 0.0011119170517825965, "train_wd": 0.2291845091372883, "epoch": 206}
208
+ {"train_loss": 5.240045312229249, "train_lr": 0.0011028600169472845, "train_wd": 0.23059608286147626, "epoch": 207}
209
+ {"train_loss": 5.235061264884987, "train_lr": 0.001093804451188027, "train_wd": 0.23200700296936133, "epoch": 208}
210
+ {"train_loss": 5.230883718573218, "train_lr": 0.001084750942107513, "train_wd": 0.2334171824287453, "epoch": 209}
211
+ {"train_loss": 5.230550956919039, "train_lr": 0.0010757000771749689, "train_wd": 0.2348265342531161, "epoch": 210}
212
+ {"train_loss": 5.233948881713321, "train_lr": 0.001066652443688048, "train_wd": 0.23623497150701492, "epoch": 211}
213
+ {"train_loss": 5.228924321524388, "train_lr": 0.001057608628734727, "train_wd": 0.23764240731139813, "epoch": 212}
214
+ {"train_loss": 5.228865062697328, "train_lr": 0.0010485692191551956, "train_wd": 0.23904875484899504, "epoch": 213}
215
+ {"train_loss": 5.223777828403085, "train_lr": 0.0010395348015037867, "train_wd": 0.240453927369665, "epoch": 214}
216
+ {"train_loss": 5.223885962949526, "train_lr": 0.0010305059620109155, "train_wd": 0.2418578381957484, "epoch": 215}
217
+ {"train_loss": 5.222076347816905, "train_lr": 0.0010214832865450365, "train_wd": 0.243260400727412, "epoch": 216}
218
+ {"train_loss": 5.220514607408064, "train_lr": 0.001012467360574633, "train_wd": 0.2446615284479924, "epoch": 217}
219
+ {"train_loss": 5.216632046859613, "train_lr": 0.0010034587691302177, "train_wd": 0.24606113492933324, "epoch": 218}
220
+ {"train_loss": 5.217693198052385, "train_lr": 0.0009944580967663863, "train_wd": 0.24745913383711168, "epoch": 219}
221
+ {"train_loss": 5.213712047740853, "train_lr": 0.000985465927523861, "train_wd": 0.24885543893617093, "epoch": 220}
222
+ {"train_loss": 5.212247799626358, "train_lr": 0.0009764828448916234, "train_wd": 0.25024996409583516, "epoch": 221}
223
+ {"train_loss": 5.211574875104199, "train_lr": 0.0009675094317690324, "train_wd": 0.2516426232952242, "epoch": 222}
224
+ {"train_loss": 5.207745313036928, "train_lr": 0.0009585462704280014, "train_wd": 0.2530333306285578, "epoch": 223}
225
+ {"train_loss": 5.204713953574069, "train_lr": 0.0009495939424752312, "train_wd": 0.25442200031045825, "epoch": 224}
226
+ {"train_loss": 5.2040555598995955, "train_lr": 0.0009406530288144493, "train_wd": 0.25580854668123715, "epoch": 225}
227
+ {"train_loss": 5.200214271083009, "train_lr": 0.0009317241096087309, "train_wd": 0.25719288421218367, "epoch": 226}
228
+ {"train_loss": 5.198365746856593, "train_lr": 0.0009228077642428482, "train_wd": 0.2585749275108371, "epoch": 227}
229
+ {"train_loss": 5.196459935473309, "train_lr": 0.0009139045712856744, "train_wd": 0.25995459132625814, "epoch": 228}
230
+ {"train_loss": 5.193586488135999, "train_lr": 0.0009050151084526453, "train_wd": 0.2613317905542832, "epoch": 229}
231
+ {"train_loss": 5.192482487778727, "train_lr": 0.0008961399525682577, "train_wd": 0.26270644024277673, "epoch": 230}
232
+ {"train_loss": 5.189850364246672, "train_lr": 0.0008872796795286629, "train_wd": 0.26407845559687093, "epoch": 231}
233
+ {"train_loss": 5.191331559341017, "train_lr": 0.0008784348642642826, "train_wd": 0.2654477519841947, "epoch": 232}
234
+ {"train_loss": 5.18354903554602, "train_lr": 0.0008696060807024997, "train_wd": 0.26681424494009987, "epoch": 233}
235
+ {"train_loss": 5.183110127900001, "train_lr": 0.00086079390173043, "train_wd": 0.2681778501728609, "epoch": 234}
236
+ {"train_loss": 5.17821652367175, "train_lr": 0.0008519988991577397, "train_wd": 0.26953848356888627, "epoch": 235}
237
+ {"train_loss": 5.177241102790089, "train_lr": 0.0008432216436795386, "train_wd": 0.2708960611978976, "epoch": 236}
238
+ {"train_loss": 5.174622281010059, "train_lr": 0.0008344627048393617, "train_wd": 0.2722504993181121, "epoch": 237}
239
+ {"train_loss": 5.173415968690416, "train_lr": 0.0008257226509921929, "train_wd": 0.273601714381407, "epoch": 238}
240
+ {"train_loss": 5.1680878972907145, "train_lr": 0.0008170020492676029, "train_wd": 0.2749496230384729, "epoch": 239}
241
+ {"train_loss": 5.164013653135986, "train_lr": 0.0008083014655329421, "train_wd": 0.27629414214395365, "epoch": 240}
242
+ {"train_loss": 5.162700611159956, "train_lr": 0.0007996214643566214, "train_wd": 0.2776351887615773, "epoch": 241}
243
+ {"train_loss": 5.1572621002686105, "train_lr": 0.0007909626089714731, "train_wd": 0.27897268016927246, "epoch": 242}
244
+ {"train_loss": 5.157746931899794, "train_lr": 0.0007823254612382202, "train_wd": 0.28030653386426885, "epoch": 243}
245
+ {"train_loss": 5.153260917775779, "train_lr": 0.0007737105816089987, "train_wd": 0.28163666756818706, "epoch": 244}
246
+ {"train_loss": 5.151542177213896, "train_lr": 0.0007651185290910018, "train_wd": 0.2829629992321151, "epoch": 245}
247
+ {"train_loss": 5.147223839228102, "train_lr": 0.0007565498612102066, "train_wd": 0.28428544704166875, "epoch": 246}
248
+ {"train_loss": 5.144464701146102, "train_lr": 0.0007480051339751896, "train_wd": 0.2856039294220365, "epoch": 247}
249
+ {"train_loss": 5.141471196332281, "train_lr": 0.000739484901841061, "train_wd": 0.28691836504301615, "epoch": 248}
250
+ {"train_loss": 5.135951406967869, "train_lr": 0.0007309897176734693, "train_wd": 0.28822867282402626, "epoch": 249}
251
+ {"train_loss": 5.132794423587174, "train_lr": 0.0007225201327127413, "train_wd": 0.2895347719391108, "epoch": 250}
252
+ {"train_loss": 5.129634815851133, "train_lr": 0.0007140766965381088, "train_wd": 0.2908365818219235, "epoch": 251}
253
+ {"train_loss": 5.1264936969541814, "train_lr": 0.0007056599570320476, "train_wd": 0.2921340221707002, "epoch": 252}
254
+ {"train_loss": 5.123294545002549, "train_lr": 0.0006972704603447194, "train_wd": 0.29342701295320767, "epoch": 253}
255
+ {"train_loss": 5.118747015704783, "train_lr": 0.000688908750858541, "train_wd": 0.2947154744116834, "epoch": 254}
256
+ {"train_loss": 5.116760482515791, "train_lr": 0.0006805753711528615, "train_wd": 0.29599932706775656, "epoch": 255}
257
+ {"train_loss": 5.1115352040786535, "train_lr": 0.000672270861968746, "train_wd": 0.2972784917273478, "epoch": 256}
258
+ {"train_loss": 5.108601342306006, "train_lr": 0.000663995762173894, "train_wd": 0.2985528894855546, "epoch": 257}
259
+ {"train_loss": 5.104100684950248, "train_lr": 0.0006557506087276733, "train_wd": 0.2998224417315206, "epoch": 258}
260
+ {"train_loss": 5.099522311160032, "train_lr": 0.0006475359366462767, "train_wd": 0.3010870701532833, "epoch": 259}
261
+ {"train_loss": 5.0968322751047515, "train_lr": 0.0006393522789679998, "train_wd": 0.30234669674260584, "epoch": 260}
262
+ {"train_loss": 5.0916343175357195, "train_lr": 0.000631200166718664, "train_wd": 0.30360124379978454, "epoch": 261}
263
+ {"train_loss": 5.086972196432327, "train_lr": 0.0006230801288771511, "train_wd": 0.3048506339384491, "epoch": 262}
264
+ {"train_loss": 5.084279034849551, "train_lr": 0.0006149926923410799, "train_wd": 0.3060947900903297, "epoch": 263}
265
+ {"train_loss": 5.079666579655892, "train_lr": 0.0006069383818926166, "train_wd": 0.30733363551001563, "epoch": 264}
266
+ {"train_loss": 5.075444788580461, "train_lr": 0.0005989177201644268, "train_wd": 0.3085670937796844, "epoch": 265}
267
+ {"train_loss": 5.071022945762181, "train_lr": 0.0005909312276057509, "train_wd": 0.3097950888138203, "epoch": 266}
268
+ {"train_loss": 5.066316359566985, "train_lr": 0.000582979422448649, "train_wd": 0.31101754486390704, "epoch": 267}
269
+ {"train_loss": 5.062460259532185, "train_lr": 0.0005750628206743634, "train_wd": 0.31223438652309454, "epoch": 268}
270
+ {"train_loss": 5.057960262973245, "train_lr": 0.0005671819359798356, "train_wd": 0.3134455387308588, "epoch": 269}
271
+ {"train_loss": 5.052473096270784, "train_lr": 0.0005593372797443834, "train_wd": 0.31465092677762657, "epoch": 270}
272
+ {"train_loss": 5.047529601293216, "train_lr": 0.0005515293609965032, "train_wd": 0.3158504763093845, "epoch": 271}
273
+ {"train_loss": 5.04287888278528, "train_lr": 0.0005437586863808581, "train_wd": 0.31704411333226823, "epoch": 272}
274
+ {"train_loss": 5.039122479639465, "train_lr": 0.0005360257601253846, "train_wd": 0.31823176421712257, "epoch": 273}
275
+ {"train_loss": 5.032568960077614, "train_lr": 0.0005283310840085874, "train_wd": 0.3194133557040474, "epoch": 274}
276
+ {"train_loss": 5.029537017468354, "train_lr": 0.0005206751573269736, "train_wd": 0.32058881490691377, "epoch": 275}
277
+ {"train_loss": 5.023634619671378, "train_lr": 0.0005130584768626509, "train_wd": 0.32175806931786083, "epoch": 276}
278
+ {"train_loss": 5.020646529303466, "train_lr": 0.0005054815368511033, "train_wd": 0.3229210468117691, "epoch": 277}
279
+ {"train_loss": 5.016135177720222, "train_lr": 0.0004979448289491085, "train_wd": 0.3240776756507079, "epoch": 278}
280
+ {"train_loss": 5.0098668969452955, "train_lr": 0.0004904488422028412, "train_wd": 0.3252278844883637, "epoch": 279}
281
+ {"train_loss": 5.006170619895562, "train_lr": 0.0004829940630161396, "train_wd": 0.32637160237443635, "epoch": 280}
282
+ {"train_loss": 4.999665899742707, "train_lr": 0.0004755809751189412, "train_wd": 0.32750875875901986, "epoch": 281}
283
+ {"train_loss": 4.995973670189615, "train_lr": 0.00046821005953589774, "train_wd": 0.3286392834969517, "epoch": 282}
284
+ {"train_loss": 4.988801797195304, "train_lr": 0.00046088179455515773, "train_wd": 0.3297631068521404, "epoch": 283}
285
+ {"train_loss": 4.985206558675074, "train_lr": 0.00045359665569733444, "train_wd": 0.3308801595018682, "epoch": 284}
286
+ {"train_loss": 4.979430549954482, "train_lr": 0.0004463551156846471, "train_wd": 0.3319903725410656, "epoch": 285}
287
+ {"train_loss": 4.973367940589822, "train_lr": 0.00043915764441025153, "train_wd": 0.3330936774865635, "epoch": 286}
288
+ {"train_loss": 4.966046810891631, "train_lr": 0.0004320047089077432, "train_wd": 0.33419000628131457, "epoch": 287}
289
+ {"train_loss": 4.962284815013051, "train_lr": 0.0004248967733208553, "train_wd": 0.335279291298595, "epoch": 288}
290
+ {"train_loss": 4.9562651147659444, "train_lr": 0.0004178342988733445, "train_wd": 0.33636146534617545, "epoch": 289}
291
+ {"train_loss": 4.95080055568001, "train_lr": 0.0004108177438390528, "train_wd": 0.3374364616704608, "epoch": 290}
292
+ {"train_loss": 4.944271500037014, "train_lr": 0.000403847563512187, "train_wd": 0.3385042139606152, "epoch": 291}
293
+ {"train_loss": 4.938631761434982, "train_lr": 0.00039692421017775475, "train_wd": 0.3395646563526489, "epoch": 292}
294
+ {"train_loss": 4.9333312649110095, "train_lr": 0.0003900481330822349, "train_wd": 0.3406177234334777, "epoch": 293}
295
+ {"train_loss": 4.92649072883941, "train_lr": 0.00038321977840441614, "train_wd": 0.34166335024496564, "epoch": 294}
296
+ {"train_loss": 4.920261191146122, "train_lr": 0.00037643958922644726, "train_wd": 0.3427014722879244, "epoch": 295}
297
+ {"train_loss": 4.912972134955639, "train_lr": 0.00036970800550508787, "train_wd": 0.3437320255260975, "epoch": 296}
298
+ {"train_loss": 4.906701816482652, "train_lr": 0.0003630254640431591, "train_wd": 0.34475494639010607, "epoch": 297}
299
+ {"train_loss": 4.899896893927234, "train_lr": 0.00035639239846120037, "train_wd": 0.34577017178137276, "epoch": 298}
300
+ {"train_loss": 4.892727703025801, "train_lr": 0.00034980923916933096, "train_wd": 0.34677763907601394, "epoch": 299}
301
+ {"train_loss": 4.886983189151156, "train_lr": 0.0003432764133393235, "train_wd": 0.3477772861287004, "epoch": 300}
302
+ {"train_loss": 4.8793741404938755, "train_lr": 0.00033679434487688504, "train_wd": 0.34876905127649377, "epoch": 301}
303
+ {"train_loss": 4.872865999515037, "train_lr": 0.0003303634543941485, "train_wd": 0.34975287334264904, "epoch": 302}
304
+ {"train_loss": 4.864671375620351, "train_lr": 0.0003239841591823808, "train_wd": 0.35072869164038517, "epoch": 303}
305
+ {"train_loss": 4.8587425362577825, "train_lr": 0.0003176568731849066, "train_wd": 0.35169644597663385, "epoch": 304}
306
+ {"train_loss": 4.851561189251695, "train_lr": 0.0003113820069702472, "train_wd": 0.3526560766557487, "epoch": 305}
307
+ {"train_loss": 4.845615127264596, "train_lr": 0.0003051599677054799, "train_wd": 0.353607524483189, "epoch": 306}
308
+ {"train_loss": 4.8380605704921615, "train_lr": 0.0002989911591298142, "train_wd": 0.3545507307691731, "epoch": 307}
309
+ {"train_loss": 4.829671723388439, "train_lr": 0.00029287598152839876, "train_wd": 0.3554856373322923, "epoch": 308}
310
+ {"train_loss": 4.8240739327969315, "train_lr": 0.00028681483170634587, "train_wd": 0.35641218650310563, "epoch": 309}
311
+ {"train_loss": 4.816649515431919, "train_lr": 0.00028080810296298114, "train_wd": 0.357330321127698, "epoch": 310}
312
+ {"train_loss": 4.808174640878285, "train_lr": 0.0002748561850663247, "train_wd": 0.3582399845711983, "epoch": 311}
313
+ {"train_loss": 4.800443130904894, "train_lr": 0.0002689594642277983, "train_wd": 0.35914112072128274, "epoch": 312}
314
+ {"train_loss": 4.7924962304443195, "train_lr": 0.0002631183230771692, "train_wd": 0.36003367399162767, "epoch": 313}
315
+ {"train_loss": 4.785386560918044, "train_lr": 0.0002573331406377131, "train_wd": 0.36091758932534296, "epoch": 314}
316
+ {"train_loss": 4.778378706800638, "train_lr": 0.00025160429230163016, "train_wd": 0.36179281219836784, "epoch": 315}
317
+ {"train_loss": 4.7710418455499255, "train_lr": 0.00024593214980567793, "train_wd": 0.3626592886228325, "epoch": 316}
318
+ {"train_loss": 4.763523285703765, "train_lr": 0.0002403170812070554, "train_wd": 0.36351696515039017, "epoch": 317}
319
+ {"train_loss": 4.754413338704146, "train_lr": 0.00023475945085951643, "train_wd": 0.364365788875511, "epoch": 318}
320
+ {"train_loss": 4.745593038742705, "train_lr": 0.000229259619389731, "train_wd": 0.3652057074387509, "epoch": 319}
321
+ {"train_loss": 4.738351850897717, "train_lr": 0.00022381794367388007, "train_wd": 0.3660366690299763, "epoch": 320}
322
+ {"train_loss": 4.728555572342029, "train_lr": 0.00021843477681450377, "train_wd": 0.36685862239156136, "epoch": 321}
323
+ {"train_loss": 4.71960553674282, "train_lr": 0.000213110468117585, "train_wd": 0.3676715168215523, "epoch": 322}
324
+ {"train_loss": 4.711377027143034, "train_lr": 0.00020784536306988464, "train_wd": 0.3684753021767905, "epoch": 323}
325
+ {"train_loss": 4.702829797231822, "train_lr": 0.00020263980331652434, "train_wd": 0.3692699288760087, "epoch": 324}
326
+ {"train_loss": 4.694897512049912, "train_lr": 0.00019749412663881707, "train_wd": 0.37005534790288946, "epoch": 325}
327
+ {"train_loss": 4.684425206993409, "train_lr": 0.00019240866693234784, "train_wd": 0.370831510809088, "epoch": 326}
328
+ {"train_loss": 4.67626074951687, "train_lr": 0.0001873837541853093, "train_wd": 0.37159836971722154, "epoch": 327}
329
+ {"train_loss": 4.666734198362922, "train_lr": 0.0001824197144570885, "train_wd": 0.37235587732381653, "epoch": 328}
330
+ {"train_loss": 4.658563957583133, "train_lr": 0.0001775168698571101, "train_wd": 0.3731039869022391, "epoch": 329}
331
+ {"train_loss": 4.651205594698302, "train_lr": 0.0001726755385239344, "train_wd": 0.37384265230556474, "epoch": 330}
332
+ {"train_loss": 4.640585822971176, "train_lr": 0.00016789603460461253, "train_wd": 0.37457182796943317, "epoch": 331}
333
+ {"train_loss": 4.631658425943242, "train_lr": 0.00016317866823430525, "train_wd": 0.37529146891485454, "epoch": 332}
334
+ {"train_loss": 4.6230639234560424, "train_lr": 0.0001585237455161564, "train_wd": 0.3760015307509843, "epoch": 333}
335
+ {"train_loss": 4.612211498067819, "train_lr": 0.00015393156850142972, "train_wd": 0.3767019696778652, "epoch": 334}
336
+ {"train_loss": 4.604454271155867, "train_lr": 0.00014940243516991158, "train_wd": 0.37739274248912325, "epoch": 335}
337
+ {"train_loss": 4.594165006103061, "train_lr": 0.0001449366394105728, "train_wd": 0.3780738065746397, "epoch": 336}
338
+ {"train_loss": 4.584006056386075, "train_lr": 0.00014053447100250053, "train_wd": 0.37874511992317167, "epoch": 337}
339
+ {"train_loss": 4.575067319074194, "train_lr": 0.0001361962155960943, "train_wd": 0.3794066411249504, "epoch": 338}
340
+ {"train_loss": 4.564600477169315, "train_lr": 0.00013192215469453092, "train_wd": 0.3800583293742328, "epoch": 339}
341
+ {"train_loss": 4.5560313582563285, "train_lr": 0.00012771256563549635, "train_wd": 0.3807001444718166, "epoch": 340}
342
+ {"train_loss": 4.546952808941368, "train_lr": 0.00012356772157319276, "train_wd": 0.3813320468275243, "epoch": 341}
343
+ {"train_loss": 4.536535692515133, "train_lr": 0.00011948789146061132, "train_wd": 0.3819539974626427, "epoch": 342}
344
+ {"train_loss": 4.528259229433122, "train_lr": 0.00011547334003208175, "train_wd": 0.3825659580123257, "epoch": 343}
345
+ {"train_loss": 4.517891302856682, "train_lr": 0.00011152432778609274, "train_wd": 0.3831678907279648, "epoch": 344}
346
+ {"train_loss": 4.506925072154695, "train_lr": 0.00010764111096839008, "train_wd": 0.38375975847951405, "epoch": 345}
347
+ {"train_loss": 4.49674551695478, "train_lr": 0.00010382394155534793, "train_wd": 0.3843415247577823, "epoch": 346}
348
+ {"train_loss": 4.488049700954478, "train_lr": 0.00010007306723761931, "train_wd": 0.38491315367668794, "epoch": 347}
349
+ {"train_loss": 4.47724774935477, "train_lr": 9.638873140406401e-05, "train_wd": 0.3854746099754623, "epoch": 348}
350
+ {"train_loss": 4.466251426624308, "train_lr": 9.277117312595344e-05, "train_wd": 0.3860258590208386, "epoch": 349}
351
+ {"train_loss": 4.457804220185863, "train_lr": 8.922062714146099e-05, "train_wd": 0.3865668668091791, "epoch": 350}
352
+ {"train_loss": 4.44732800053714, "train_lr": 8.573732384042698e-05, "train_wd": 0.3870975999685752, "epoch": 351}
353
+ {"train_loss": 4.436543436055418, "train_lr": 8.232148924941129e-05, "train_wd": 0.3876180257609052, "epoch": 352}
354
+ {"train_loss": 4.426954548127002, "train_lr": 7.897334501702503e-05, "train_wd": 0.3881281120838543, "epoch": 353}
355
+ {"train_loss": 4.41578244219581, "train_lr": 7.569310839954948e-05, "train_wd": 0.3886278274728974, "epoch": 354}
356
+ {"train_loss": 4.407736654949488, "train_lr": 7.248099224683806e-05, "train_wd": 0.38911714110323253, "epoch": 355}
357
+ {"train_loss": 4.395862544299387, "train_lr": 6.933720498850462e-05, "train_wd": 0.38959602279169175, "epoch": 356}
358
+ {"train_loss": 4.386592810486647, "train_lr": 6.626195062039929e-05, "train_wd": 0.39006444299859705, "epoch": 357}
359
+ {"train_loss": 4.375733322153489, "train_lr": 6.325542869137099e-05, "train_wd": 0.3905223728295828, "epoch": 358}
360
+ {"train_loss": 4.36565443567878, "train_lr": 6.031783429031898e-05, "train_wd": 0.3909697840373807, "epoch": 359}
361
+ {"train_loss": 4.355564466393966, "train_lr": 5.7449358033534445e-05, "train_wd": 0.3914066490235593, "epoch": 360}
362
+ {"train_loss": 4.344885043210263, "train_lr": 5.465018605233098e-05, "train_wd": 0.3918329408402287, "epoch": 361}
363
+ {"train_loss": 4.335520960051093, "train_lr": 5.192049998096696e-05, "train_wd": 0.39224863319170084, "epoch": 362}
364
+ {"train_loss": 4.326140600616197, "train_lr": 4.926047694485985e-05, "train_wd": 0.3926537004361162, "epoch": 363}
365
+ {"train_loss": 4.31593851194822, "train_lr": 4.6670289549092546e-05, "train_wd": 0.3930481175870156, "epoch": 364}
366
+ {"train_loss": 4.306212983417997, "train_lr": 4.4150105867213124e-05, "train_wd": 0.3934318603148934, "epoch": 365}
367
+ {"train_loss": 4.298082825788062, "train_lr": 4.1700089430329086e-05, "train_wd": 0.39380490494868947, "epoch": 366}
368
+ {"train_loss": 4.286265307398652, "train_lr": 3.932039921649631e-05, "train_wd": 0.3941672284772548, "epoch": 367}
369
+ {"train_loss": 4.276728308431322, "train_lr": 3.701118964040234e-05, "train_wd": 0.39451880855076554, "epoch": 368}
370
+ {"train_loss": 4.268159883110214, "train_lr": 3.4772610543347296e-05, "train_wd": 0.3948596234821091, "epoch": 369}
371
+ {"train_loss": 4.258168973100128, "train_lr": 3.2604807183520946e-05, "train_wd": 0.3951896522482136, "epoch": 370}
372
+ {"train_loss": 4.249997297404624, "train_lr": 3.0507920226576605e-05, "train_wd": 0.3955088744913507, "epoch": 371}
373
+ {"train_loss": 4.242101726941853, "train_lr": 2.8482085736503965e-05, "train_wd": 0.3958172705203882, "epoch": 372}
374
+ {"train_loss": 4.232887092924161, "train_lr": 2.652743516679996e-05, "train_wd": 0.3961148213120063, "epoch": 373}
375
+ {"train_loss": 4.2237875755313485, "train_lr": 2.4644095351939004e-05, "train_wd": 0.3964015085118724, "epoch": 374}
376
+ {"train_loss": 4.217320317728556, "train_lr": 2.283218849914263e-05, "train_wd": 0.3966773144357674, "epoch": 375}
377
+ {"train_loss": 4.207789967975599, "train_lr": 2.1091832180450064e-05, "train_wd": 0.3969422220706831, "epoch": 376}
378
+ {"train_loss": 4.200360547483182, "train_lr": 1.942313932508876e-05, "train_wd": 0.3971962150758693, "epoch": 377}
379
+ {"train_loss": 4.193593175621698, "train_lr": 1.782621821214669e-05, "train_wd": 0.3974392777838421, "epoch": 378}
380
+ {"train_loss": 4.185997710435939, "train_lr": 1.630117246354651e-05, "train_wd": 0.3976713952013454, "epoch": 379}
381
+ {"train_loss": 4.179574521495212, "train_lr": 1.4848101037321326e-05, "train_wd": 0.3978925530102874, "epoch": 380}
382
+ {"train_loss": 4.170817840174377, "train_lr": 1.3467098221193672e-05, "train_wd": 0.3981027375686105, "epoch": 381}
383
+ {"train_loss": 4.165872473618109, "train_lr": 1.2158253626457194e-05, "train_wd": 0.39830193591114177, "epoch": 382}
384
+ {"train_loss": 4.158825963172767, "train_lr": 1.092165218216205e-05, "train_wd": 0.39849013575038866, "epoch": 383}
385
+ {"train_loss": 4.154229786845563, "train_lr": 9.75737412960382e-06, "train_wd": 0.398667325477299, "epoch": 384}
386
+ {"train_loss": 4.148727393470151, "train_lr": 8.6654950171168e-06, "train_wd": 0.3988334941619753, "epoch": 385}
387
+ {"train_loss": 4.143364845393158, "train_lr": 7.646085695171953e-06, "train_wd": 0.3989886315543516, "epoch": 386}
388
+ {"train_loss": 4.139082619996308, "train_lr": 6.699212311779304e-06, "train_wd": 0.39913272808482037, "epoch": 387}
389
+ {"train_loss": 4.13602033943581, "train_lr": 5.824936308195733e-06, "train_wd": 0.3992657748648322, "epoch": 388}
390
+ {"train_loss": 4.1309623175905905, "train_lr": 5.0233144149382675e-06, "train_wd": 0.3993877636874319, "epoch": 389}
391
+ {"train_loss": 4.1286045256153425, "train_lr": 4.294398648102762e-06, "train_wd": 0.3994986870277766, "epoch": 390}
392
+ {"train_loss": 4.125183607167978, "train_lr": 3.63823630598877e-06, "train_wd": 0.39959853804359, "epoch": 391}
393
+ {"train_loss": 4.121790976368552, "train_lr": 3.054869966030341e-06, "train_wd": 0.3996873105755923, "epoch": 392}
394
+ {"train_loss": 4.118684218539823, "train_lr": 2.5443374820332894e-06, "train_wd": 0.3997649991478766, "epoch": 393}
395
+ {"train_loss": 4.116305466446517, "train_lr": 2.1066719817188773e-06, "train_wd": 0.3998315989682437, "epoch": 394}
396
+ {"train_loss": 4.114498018244688, "train_lr": 1.741901864574217e-06, "train_wd": 0.39988710592850374, "epoch": 395}
397
+ {"train_loss": 4.113448657720781, "train_lr": 1.450050800009479e-06, "train_wd": 0.3999315166047262, "epoch": 396}
398
+ {"train_loss": 4.111802810200041, "train_lr": 1.2311377258219986e-06, "train_wd": 0.3999648282574527, "epoch": 397}
399
+ {"train_loss": 4.111367762839194, "train_lr": 1.0851768469674523e-06, "train_wd": 0.3999870388318609, "epoch": 398}
400
+ {"train_loss": 4.111147170006443, "train_lr": 1.0121776346380885e-06, "train_wd": 0.39999814695790026, "epoch": 399}
Vim/Small/log_eval.txt ADDED
@@ -0,0 +1,100 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"train_lr": 0.0019999999999998686, "train_loss": 1.5462792072887188, "epoch": 0, "test_loss": 1.0653163286502405, "test_acc1": 73.264, "test_acc5": 92.156}
2
+ {"train_lr": 0.0019995065603657376, "train_loss": 1.1620918199795034, "epoch": 1, "test_loss": 0.9953323697952359, "test_acc1": 74.706, "test_acc5": 92.786}
3
+ {"train_lr": 0.0019980267284282105, "train_loss": 1.093948356018417, "epoch": 2, "test_loss": 0.9654222754261378, "test_acc1": 75.196, "test_acc5": 93.08}
4
+ {"train_lr": 0.001995561964603092, "train_loss": 1.055096378314033, "epoch": 3, "test_loss": 0.9451440002607263, "test_acc1": 75.702, "test_acc5": 93.248}
5
+ {"train_lr": 0.0019921147013145773, "train_loss": 1.0299462808211994, "epoch": 4, "test_loss": 0.9315123357202696, "test_acc1": 75.86, "test_acc5": 93.354}
6
+ {"train_lr": 0.0019876883405950175, "train_loss": 1.00895006465307, "epoch": 5, "test_loss": 0.9217294724586674, "test_acc1": 76.066, "test_acc5": 93.44}
7
+ {"train_lr": 0.0019822872507288198, "train_loss": 0.9937279445442542, "epoch": 6, "test_loss": 0.9183257005899154, "test_acc1": 76.246, "test_acc5": 93.478}
8
+ {"train_lr": 0.0019759167619387524, "train_loss": 0.9801143079823462, "epoch": 7, "test_loss": 0.9134514866125248, "test_acc1": 76.328, "test_acc5": 93.546}
9
+ {"train_lr": 0.001968583161128624, "train_loss": 0.9713082210783286, "epoch": 8, "test_loss": 0.909379768764119, "test_acc1": 76.252, "test_acc5": 93.602}
10
+ {"train_lr": 0.001960293685677003, "train_loss": 0.964412150457293, "epoch": 9, "test_loss": 0.9043817922587285, "test_acc1": 76.374, "test_acc5": 93.652}
11
+ {"train_lr": 0.0019510565162951365, "train_loss": 0.9554298663771585, "epoch": 10, "test_loss": 0.9048832649617549, "test_acc1": 76.41, "test_acc5": 93.65}
12
+ {"train_lr": 0.0019408807689541316, "train_loss": 0.952100750066331, "epoch": 11, "test_loss": 0.9035057433311592, "test_acc1": 76.434, "test_acc5": 93.618}
13
+ {"train_lr": 0.0019297764858882515, "train_loss": 0.94578595869645, "epoch": 12, "test_loss": 0.8990269072182343, "test_acc1": 76.604, "test_acc5": 93.746}
14
+ {"train_lr": 0.0019177546256839834, "train_loss": 0.9423461016051731, "epoch": 13, "test_loss": 0.8976540658480067, "test_acc1": 76.452, "test_acc5": 93.732}
15
+ {"train_lr": 0.0019048270524661083, "train_loss": 0.9392712370418473, "epoch": 14, "test_loss": 0.8979446694559758, "test_acc1": 76.582, "test_acc5": 93.708}
16
+ {"train_lr": 0.0018910065241883177, "train_loss": 0.9348282062329867, "epoch": 15, "test_loss": 0.8960327804660249, "test_acc1": 76.604, "test_acc5": 93.764}
17
+ {"train_lr": 0.0018763066800438779, "train_loss": 0.9309803891839192, "epoch": 16, "test_loss": 0.8942813928932181, "test_acc1": 76.584, "test_acc5": 93.688}
18
+ {"train_lr": 0.0018607420270040137, "train_loss": 0.9286438047058383, "epoch": 17, "test_loss": 0.8942481704875637, "test_acc1": 76.726, "test_acc5": 93.712}
19
+ {"train_lr": 0.001844327925502041, "train_loss": 0.9258772233159505, "epoch": 18, "test_loss": 0.8927681097937057, "test_acc1": 76.704, "test_acc5": 93.764}
20
+ {"train_lr": 0.0018270805742745338, "train_loss": 0.9242971756019642, "epoch": 19, "test_loss": 0.8923569080584189, "test_acc1": 76.826, "test_acc5": 93.816}
21
+ {"train_lr": 0.0018090169943749148, "train_loss": 0.9208041346857798, "epoch": 20, "test_loss": 0.8913304988494919, "test_acc1": 76.728, "test_acc5": 93.826}
22
+ {"train_lr": 0.001790155012375684, "train_loss": 0.9207657220104767, "epoch": 21, "test_loss": 0.8900808066015353, "test_acc1": 76.684, "test_acc5": 93.822}
23
+ {"train_lr": 0.00177051324277586, "train_loss": 0.9167353716127119, "epoch": 22, "test_loss": 0.8917422776522539, "test_acc1": 76.646, "test_acc5": 93.802}
24
+ {"train_lr": 0.0017501110696303821, "train_loss": 0.9158053922798459, "epoch": 23, "test_loss": 0.889882964322634, "test_acc1": 76.668, "test_acc5": 93.794}
25
+ {"train_lr": 0.001728968627421389, "train_loss": 0.9145920997231758, "epoch": 24, "test_loss": 0.8899718871163895, "test_acc1": 76.864, "test_acc5": 93.764}
26
+ {"train_lr": 0.0017071067811865767, "train_loss": 0.9132478059713383, "epoch": 25, "test_loss": 0.8884405900374093, "test_acc1": 76.918, "test_acc5": 93.838}
27
+ {"train_lr": 0.0016845471059286062, "train_loss": 0.9135288151261619, "epoch": 26, "test_loss": 0.889947284765713, "test_acc1": 76.83, "test_acc5": 93.784}
28
+ {"train_lr": 0.001661311865323677, "train_loss": 0.910536366724344, "epoch": 27, "test_loss": 0.8899172185479528, "test_acc1": 76.842, "test_acc5": 93.792}
29
+ {"train_lr": 0.001637423989748733, "train_loss": 0.9118115852147496, "epoch": 28, "test_loss": 0.8893519162445727, "test_acc1": 76.818, "test_acc5": 93.858}
30
+ {"train_lr": 0.001612907053652909, "train_loss": 0.9095455825126414, "epoch": 29, "test_loss": 0.8880549875824043, "test_acc1": 76.744, "test_acc5": 93.84}
31
+ {"train_lr": 0.0015877852522924111, "train_loss": 0.9071214361621578, "epoch": 30, "test_loss": 0.8855601080771908, "test_acc1": 76.932, "test_acc5": 93.846}
32
+ {"train_lr": 0.0015620833778521046, "train_loss": 0.9051265161167465, "epoch": 31, "test_loss": 0.8861170669307794, "test_acc1": 76.906, "test_acc5": 93.85}
33
+ {"train_lr": 0.0015358267949790963, "train_loss": 0.9058243562960405, "epoch": 32, "test_loss": 0.8854435998803515, "test_acc1": 76.872, "test_acc5": 93.84}
34
+ {"train_lr": 0.0015090414157503675, "train_loss": 0.90287453468697, "epoch": 33, "test_loss": 0.884228560568579, "test_acc1": 76.972, "test_acc5": 93.86}
35
+ {"train_lr": 0.0014817536741017646, "train_loss": 0.9030093112785579, "epoch": 34, "test_loss": 0.885163737932587, "test_acc1": 76.958, "test_acc5": 93.858}
36
+ {"train_lr": 0.001453990499739611, "train_loss": 0.9012188788382853, "epoch": 35, "test_loss": 0.8846786753715151, "test_acc1": 76.884, "test_acc5": 93.862}
37
+ {"train_lr": 0.0014257792915651636, "train_loss": 0.8998472729368159, "epoch": 36, "test_loss": 0.8848289616425019, "test_acc1": 76.898, "test_acc5": 93.866}
38
+ {"train_lr": 0.001397147890634744, "train_loss": 0.9015668814259913, "epoch": 37, "test_loss": 0.8833087302763444, "test_acc1": 76.91, "test_acc5": 93.898}
39
+ {"train_lr": 0.001368124552684745, "train_loss": 0.899501782352692, "epoch": 38, "test_loss": 0.8840746038862507, "test_acc1": 77.044, "test_acc5": 93.862}
40
+ {"train_lr": 0.0013387379202453142, "train_loss": 0.8990368374522524, "epoch": 39, "test_loss": 0.8824718763189547, "test_acc1": 76.984, "test_acc5": 93.922}
41
+ {"train_lr": 0.0013090169943749093, "train_loss": 0.8948185657542846, "epoch": 40, "test_loss": 0.8814613452881498, "test_acc1": 77.056, "test_acc5": 93.864}
42
+ {"train_lr": 0.0012789911060391633, "train_loss": 0.895819385621222, "epoch": 41, "test_loss": 0.881209047439763, "test_acc1": 77.002, "test_acc5": 93.854}
43
+ {"train_lr": 0.0012486898871647862, "train_loss": 0.897623048378642, "epoch": 42, "test_loss": 0.8843644160367644, "test_acc1": 76.858, "test_acc5": 93.896}
44
+ {"train_lr": 0.001218143241396569, "train_loss": 0.8947948385751872, "epoch": 43, "test_loss": 0.8816810119754214, "test_acc1": 76.9, "test_acc5": 93.894}
45
+ {"train_lr": 0.0011873813145856604, "train_loss": 0.8958690658723694, "epoch": 44, "test_loss": 0.8802744570328757, "test_acc1": 76.964, "test_acc5": 93.894}
46
+ {"train_lr": 0.0011564344650402871, "train_loss": 0.8941386539669118, "epoch": 45, "test_loss": 0.8818962137069544, "test_acc1": 77.004, "test_acc5": 93.898}
47
+ {"train_lr": 0.0011253332335643327, "train_loss": 0.8925709486829249, "epoch": 46, "test_loss": 0.8812150349435599, "test_acc1": 76.984, "test_acc5": 93.946}
48
+ {"train_lr": 0.001094108313318475, "train_loss": 0.8926951521683872, "epoch": 47, "test_loss": 0.8807723995136179, "test_acc1": 77.03, "test_acc5": 93.906}
49
+ {"train_lr": 0.0010627905195293463, "train_loss": 0.8915551941822493, "epoch": 48, "test_loss": 0.8798098120924152, "test_acc1": 76.936, "test_acc5": 93.93}
50
+ {"train_lr": 0.0010314107590780974, "train_loss": 0.8887458967831532, "epoch": 49, "test_loss": 0.8787258478343639, "test_acc1": 77.078, "test_acc5": 93.91}
51
+ {"train_lr": 0.0009999999999999343, "train_loss": 0.8909619553680663, "epoch": 50, "test_loss": 0.8777747804017932, "test_acc1": 77.03, "test_acc5": 93.92}
52
+ {"train_lr": 0.0009685892409218651, "train_loss": 0.8911836404045296, "epoch": 51, "test_loss": 0.8794785176815889, "test_acc1": 76.994, "test_acc5": 93.928}
53
+ {"train_lr": 0.0009372094804707101, "train_loss": 0.8884809423078788, "epoch": 52, "test_loss": 0.8785548080187624, "test_acc1": 77.076, "test_acc5": 93.932}
54
+ {"train_lr": 0.0009058916866814987, "train_loss": 0.8882480381496468, "epoch": 53, "test_loss": 0.8784954836949364, "test_acc1": 77.028, "test_acc5": 93.916}
55
+ {"train_lr": 0.0008746667664356905, "train_loss": 0.8895337167075049, "epoch": 54, "test_loss": 0.8795459202450254, "test_acc1": 77.006, "test_acc5": 93.848}
56
+ {"train_lr": 0.0008435655349597399, "train_loss": 0.8860804490295592, "epoch": 55, "test_loss": 0.8787395966517956, "test_acc1": 77.044, "test_acc5": 93.922}
57
+ {"train_lr": 0.0008126186854142688, "train_loss": 0.8864286131725233, "epoch": 56, "test_loss": 0.8758610734320662, "test_acc1": 77.116, "test_acc5": 93.944}
58
+ {"train_lr": 0.0007818567586034925, "train_loss": 0.8868225071902186, "epoch": 57, "test_loss": 0.8770260750828192, "test_acc1": 77.132, "test_acc5": 93.924}
59
+ {"train_lr": 0.0007513101128351359, "train_loss": 0.8849723490414217, "epoch": 58, "test_loss": 0.8765480796546887, "test_acc1": 77.166, "test_acc5": 93.926}
60
+ {"train_lr": 0.000721008893960812, "train_loss": 0.8831905472965608, "epoch": 59, "test_loss": 0.8764536295400556, "test_acc1": 77.14, "test_acc5": 93.92}
61
+ {"train_lr": 0.0006909830056250302, "train_loss": 0.8828135836025595, "epoch": 60, "test_loss": 0.8774458002632536, "test_acc1": 77.156, "test_acc5": 93.876}
62
+ {"train_lr": 0.0006612620797547435, "train_loss": 0.8831019367794966, "epoch": 61, "test_loss": 0.8758931152732171, "test_acc1": 77.222, "test_acc5": 93.924}
63
+ {"train_lr": 0.0006318754473153419, "train_loss": 0.8837904712937614, "epoch": 62, "test_loss": 0.8759348775114855, "test_acc1": 77.21, "test_acc5": 93.89}
64
+ {"train_lr": 0.0006028521093652263, "train_loss": 0.882364670631055, "epoch": 63, "test_loss": 0.8754696204229389, "test_acc1": 77.172, "test_acc5": 93.87}
65
+ {"train_lr": 0.000574220708434935, "train_loss": 0.8827679880228321, "epoch": 64, "test_loss": 0.8748686394613722, "test_acc1": 77.198, "test_acc5": 93.882}
66
+ {"train_lr": 0.0005460095002604524, "train_loss": 0.880867308814598, "epoch": 65, "test_loss": 0.8757139533338949, "test_acc1": 77.214, "test_acc5": 93.906}
67
+ {"train_lr": 0.0005182463258982946, "train_loss": 0.8807085690483349, "epoch": 66, "test_loss": 0.8745943027574693, "test_acc1": 77.198, "test_acc5": 93.884}
68
+ {"train_lr": 0.0004909585842496341, "train_loss": 0.8804059327750077, "epoch": 67, "test_loss": 0.8754880680033313, "test_acc1": 77.214, "test_acc5": 93.888}
69
+ {"train_lr": 0.0004641732050210111, "train_loss": 0.8800576613264183, "epoch": 68, "test_loss": 0.8737323259567971, "test_acc1": 77.158, "test_acc5": 93.932}
70
+ {"train_lr": 0.0004379166221478616, "train_loss": 0.8782465891585891, "epoch": 69, "test_loss": 0.8744356098306149, "test_acc1": 77.232, "test_acc5": 93.898}
71
+ {"train_lr": 0.00041221474770750024, "train_loss": 0.8775008486280954, "epoch": 70, "test_loss": 0.8731217507816031, "test_acc1": 77.248, "test_acc5": 93.934}
72
+ {"train_lr": 0.0003870929463470055, "train_loss": 0.8789784855518492, "epoch": 71, "test_loss": 0.872324996020483, "test_acc1": 77.336, "test_acc5": 93.934}
73
+ {"train_lr": 0.0003625760102513295, "train_loss": 0.8785202709189235, "epoch": 72, "test_loss": 0.8731379475053924, "test_acc1": 77.234, "test_acc5": 93.906}
74
+ {"train_lr": 0.0003386881346763327, "train_loss": 0.8758976873199414, "epoch": 73, "test_loss": 0.8730513187854186, "test_acc1": 77.224, "test_acc5": 93.896}
75
+ {"train_lr": 0.0003154528940713109, "train_loss": 0.8774554843735657, "epoch": 74, "test_loss": 0.8731896214930298, "test_acc1": 77.292, "test_acc5": 93.918}
76
+ {"train_lr": 0.00029289321881343744, "train_loss": 0.876272294835548, "epoch": 75, "test_loss": 0.8719317844266172, "test_acc1": 77.282, "test_acc5": 93.948}
77
+ {"train_lr": 0.0002710313725785874, "train_loss": 0.87604077666986, "epoch": 76, "test_loss": 0.8720863432530552, "test_acc1": 77.356, "test_acc5": 93.93}
78
+ {"train_lr": 0.0002498889303695469, "train_loss": 0.8773246523985565, "epoch": 77, "test_loss": 0.8718440565840363, "test_acc1": 77.318, "test_acc5": 93.972}
79
+ {"train_lr": 0.0002294867572242191, "train_loss": 0.8755367963053539, "epoch": 78, "test_loss": 0.8719188288578292, "test_acc1": 77.28, "test_acc5": 93.936}
80
+ {"train_lr": 0.0002098449876243195, "train_loss": 0.8756687853439208, "epoch": 79, "test_loss": 0.8718071426729412, "test_acc1": 77.262, "test_acc5": 93.954}
81
+ {"train_lr": 0.00019098300562504553, "train_loss": 0.8743142408523091, "epoch": 80, "test_loss": 0.8718557763854256, "test_acc1": 77.312, "test_acc5": 93.942}
82
+ {"train_lr": 0.00017291942572544524, "train_loss": 0.8728714693982126, "epoch": 81, "test_loss": 0.8716417792851053, "test_acc1": 77.26, "test_acc5": 93.942}
83
+ {"train_lr": 0.0001556720744979767, "train_loss": 0.8737623748770248, "epoch": 82, "test_loss": 0.8721112250671972, "test_acc1": 77.252, "test_acc5": 93.984}
84
+ {"train_lr": 0.00013925797299606019, "train_loss": 0.8760512217141083, "epoch": 83, "test_loss": 0.8718814796689526, "test_acc1": 77.298, "test_acc5": 93.946}
85
+ {"train_lr": 0.00012369331995613583, "train_loss": 0.8744523789416634, "epoch": 84, "test_loss": 0.8716564924096513, "test_acc1": 77.25, "test_acc5": 93.972}
86
+ {"train_lr": 0.00010899347581163435, "train_loss": 0.8728500791682846, "epoch": 85, "test_loss": 0.8717586801142034, "test_acc1": 77.272, "test_acc5": 93.96}
87
+ {"train_lr": 9.5172947533978e-05, "train_loss": 0.8723777536982972, "epoch": 86, "test_loss": 0.8714664308425716, "test_acc1": 77.336, "test_acc5": 93.952}
88
+ {"train_lr": 8.224537431602316e-05, "train_loss": 0.8740031649911113, "epoch": 87, "test_loss": 0.8713907648230452, "test_acc1": 77.326, "test_acc5": 93.938}
89
+ {"train_lr": 7.022351411175157e-05, "train_loss": 0.8725077246028902, "epoch": 88, "test_loss": 0.8715437166297527, "test_acc1": 77.322, "test_acc5": 93.942}
90
+ {"train_lr": 5.911923104577377e-05, "train_loss": 0.8716816987501493, "epoch": 89, "test_loss": 0.8713589954139936, "test_acc1": 77.31, "test_acc5": 93.956}
91
+ {"train_lr": 4.8943483704848814e-05, "train_loss": 0.8709226178494254, "epoch": 90, "test_loss": 0.8714540137163819, "test_acc1": 77.306, "test_acc5": 93.942}
92
+ {"train_lr": 3.9706314323055196e-05, "train_loss": 0.8717560150500206, "epoch": 91, "test_loss": 0.8712906101932916, "test_acc1": 77.33, "test_acc5": 93.956}
93
+ {"train_lr": 3.141683887136792e-05, "train_loss": 0.8714423571235886, "epoch": 92, "test_loss": 0.871273936613289, "test_acc1": 77.358, "test_acc5": 93.942}
94
+ {"train_lr": 2.4083238061252423e-05, "train_loss": 0.8698204204505603, "epoch": 93, "test_loss": 0.8711841354894516, "test_acc1": 77.328, "test_acc5": 93.95}
95
+ {"train_lr": 1.7712749271312274e-05, "train_loss": 0.8716913644690253, "epoch": 94, "test_loss": 0.8711778729811044, "test_acc1": 77.326, "test_acc5": 93.954}
96
+ {"train_lr": 1.2311659404861753e-05, "train_loss": 0.8734283813365069, "epoch": 95, "test_loss": 0.8711828852019956, "test_acc1": 77.308, "test_acc5": 93.948}
97
+ {"train_lr": 7.885298685522277e-06, "train_loss": 0.8702041474232376, "epoch": 96, "test_loss": 0.8711996051432837, "test_acc1": 77.298, "test_acc5": 93.946}
98
+ {"train_lr": 4.4380353969200165e-06, "train_loss": 0.8719592322820527, "epoch": 97, "test_loss": 0.8711975683908328, "test_acc1": 77.3, "test_acc5": 93.944}
99
+ {"train_lr": 1.9732715717283947e-06, "train_loss": 0.8701257964717451, "epoch": 98, "test_loss": 0.8711981868652432, "test_acc1": 77.3, "test_acc5": 93.94}
100
+ {"train_lr": 4.934396342684219e-07, "train_loss": 0.8710531863364228, "epoch": 99, "test_loss": 0.8711977390681996, "test_acc1": 77.3, "test_acc5": 93.94}
Vim/Tiny/checkpoint.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50d6b140e664465bd3c361e8e9a71ce35f0218a32bf35361336f2d211448f918
3
+ size 525052196
Vim/Tiny/checkpoint.pth.tar ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13965b5215d0499c599b0a644f036380a39446ced57154a2fdb63dc23d72d308
3
+ size 16394632
Vim/Tiny/config.txt ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ arch: vim_tiny_patch16_224
2
+ batch_size_per_gpu: 64
3
+ clip_grad: 3.0
4
+ drop_path_rate: 0.1
5
+ epochs: 300
6
+ freeze_last_layer: 1
7
+ global_crops_scale: (0.4, 1.0)
8
+ gpu: 0
9
+ local_crops_number: 8
10
+ local_crops_scale: (0.05, 0.4)
11
+ local_rank: 0
12
+ lr: 0.0005
13
+ min_lr: 1e-06
14
+ momentum_teacher: 0.996
15
+ ngpus: 8
16
+ nodes: 2
17
+ norm_last_layer: True
18
+ num_workers: 10
19
+ optimizer: adamw
20
+ out_dim: 65536
21
+ partition: main
22
+ patch_size: 16
23
+ rank: 0
24
+ saveckp_freq: 5
25
+ seed: 0
26
+ teacher_temp: 0.07
27
+ use_bn_in_head: False
28
+ use_fp16: True (bf16)
29
+ use_volta32: False
30
+ warmup_epochs: 10
31
+ warmup_teacher_temp: 0.04
32
+ warmup_teacher_temp_epochs: 30
33
+ weight_decay: 0.04
34
+ weight_decay_end: 0.4
35
+ world_size: 16
Vim/Tiny/log.txt ADDED
@@ -0,0 +1,300 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"train_loss": 9.422255354486019, "train_lr": 9.992805180270203e-05, "train_wd": 0.04000328590649605, "epoch": 0}
2
+ {"train_loss": 9.149647276261918, "train_lr": 0.00029994404029099034, "train_wd": 0.04002301668527509, "epoch": 1}
3
+ {"train_loss": 8.820922415581443, "train_lr": 0.0004999600287792787, "train_wd": 0.040062483968430894, "epoch": 2}
4
+ {"train_loss": 7.248332084702263, "train_lr": 0.0006999760172675668, "train_wd": 0.040121683427931, "epoch": 3}
5
+ {"train_loss": 6.398293628705015, "train_lr": 0.0008999920057558545, "train_wd": 0.04020060857188757, "epoch": 4}
6
+ {"train_loss": 5.894707517134105, "train_lr": 0.0011000079942441437, "train_wd": 0.04029925074526934, "epoch": 5}
7
+ {"train_loss": 5.57176185821553, "train_lr": 0.0013000239827324325, "train_wd": 0.04041759913085018, "epoch": 6}
8
+ {"train_loss": 5.343682085009788, "train_lr": 0.00150003997122072, "train_wd": 0.04055564075039605, "epoch": 7}
9
+ {"train_loss": 5.173390032171155, "train_lr": 0.0017000559597090108, "train_wd": 0.04071336046608778, "epoch": 8}
10
+ {"train_loss": 5.05073303548838, "train_lr": 0.0019000719481972992, "train_wd": 0.040890740982181185, "epoch": 9}
11
+ {"train_loss": 4.955588597735817, "train_lr": 0.0019999804740649203, "train_wd": 0.04108776284690386, "epoch": 10}
12
+ {"train_loss": 4.887250697322124, "train_lr": 0.0019998632274806126, "train_wd": 0.04130440445458789, "epoch": 11}
13
+ {"train_loss": 4.843188836134309, "train_lr": 0.0019996287011906193, "train_wd": 0.041540642048039866, "epoch": 12}
14
+ {"train_loss": 4.814737065637902, "train_lr": 0.0019992769227176214, "train_wd": 0.04179644972114549, "epoch": 13}
15
+ {"train_loss": 4.7942842399950125, "train_lr": 0.001998807933344397, "train_wd": 0.04207179942171064, "epoch": 14}
16
+ {"train_loss": 4.780849778204322, "train_lr": 0.001998221788108922, "train_wd": 0.0423666609545378, "epoch": 15}
17
+ {"train_loss": 4.771869034170628, "train_lr": 0.0019975185557979396, "train_wd": 0.04268100198473705, "epoch": 16}
18
+ {"train_loss": 4.765753432715254, "train_lr": 0.001996698318938875, "train_wd": 0.04301478804127214, "epoch": 17}
19
+ {"train_loss": 4.76710769388792, "train_lr": 0.001995761173790171, "train_wd": 0.04336798252074061, "epoch": 18}
20
+ {"train_loss": 4.77000752067585, "train_lr": 0.0019947072303299626, "train_wd": 0.04374054669138758, "epoch": 19}
21
+ {"train_loss": 4.777466228992628, "train_lr": 0.001993536612243176, "train_wd": 0.04413243969735341, "epoch": 20}
22
+ {"train_loss": 4.789177372277402, "train_lr": 0.0019922494569070475, "train_wd": 0.0445436185631536, "epoch": 21}
23
+ {"train_loss": 4.804613028403571, "train_lr": 0.001990845915374956, "train_wd": 0.04497403819839207, "epoch": 22}
24
+ {"train_loss": 4.822053124030813, "train_lr": 0.00198932615235873, "train_wd": 0.045423651402705455, "epoch": 23}
25
+ {"train_loss": 4.845032735455999, "train_lr": 0.001987690346209293, "train_wd": 0.04589240887093915, "epoch": 24}
26
+ {"train_loss": 4.87204266714154, "train_lr": 0.001985938688895749, "train_wd": 0.04638025919855438, "epoch": 25}
27
+ {"train_loss": 4.904736080448881, "train_lr": 0.00198407138598285, "train_wd": 0.04688714888726504, "epoch": 26}
28
+ {"train_loss": 4.945652410661955, "train_lr": 0.0019820886566068725, "train_wd": 0.0474130223509048, "epoch": 27}
29
+ {"train_loss": 5.000821680735817, "train_lr": 0.001979990733449899, "train_wd": 0.04795782192152221, "epoch": 28}
30
+ {"train_loss": 5.086788926407587, "train_lr": 0.0019777778627125204, "train_wd": 0.04852148785570515, "epoch": 29}
31
+ {"train_loss": 5.144751373907741, "train_lr": 0.0019754503040849123, "train_wd": 0.04910395834113187, "epoch": 30}
32
+ {"train_loss": 5.191997510923756, "train_lr": 0.00197300833071642, "train_wd": 0.049705169503349717, "epoch": 31}
33
+ {"train_loss": 5.2221205586866795, "train_lr": 0.0019704522291834345, "train_wd": 0.05032505541277995, "epoch": 32}
34
+ {"train_loss": 5.234231495004383, "train_lr": 0.001967782299455807, "train_wd": 0.05096354809194695, "epoch": 33}
35
+ {"train_loss": 5.24043213346784, "train_lr": 0.001964998854861625, "train_wd": 0.05162057752293346, "epoch": 34}
36
+ {"train_loss": 5.240060033296033, "train_lr": 0.0019621022220504525, "train_wd": 0.052296071655058056, "epoch": 35}
37
+ {"train_loss": 5.236362775833868, "train_lr": 0.0019590927409550065, "train_wd": 0.052989956412777164, "epoch": 36}
38
+ {"train_loss": 5.234892796007373, "train_lr": 0.0019559707647512155, "train_wd": 0.05370215570380788, "epoch": 37}
39
+ {"train_loss": 5.222516710237919, "train_lr": 0.0019527366598168455, "train_wd": 0.054432591427471845, "epoch": 38}
40
+ {"train_loss": 5.2180857766303514, "train_lr": 0.0019493908056884435, "train_wd": 0.05518118348326112, "epoch": 39}
41
+ {"train_loss": 5.217184919747803, "train_lr": 0.0019459335950168233, "train_wd": 0.05594784977962063, "epoch": 40}
42
+ {"train_loss": 5.223070632043979, "train_lr": 0.0019423654335209903, "train_wd": 0.05673250624295146, "epoch": 41}
43
+ {"train_loss": 5.232140705406333, "train_lr": 0.0019386867399405164, "train_wd": 0.05753506682683021, "epoch": 42}
44
+ {"train_loss": 5.240522819886104, "train_lr": 0.0019348979459864015, "train_wd": 0.058355443521444686, "epoch": 43}
45
+ {"train_loss": 5.250755113258446, "train_lr": 0.001930999496290417, "train_wd": 0.05919354636324573, "epoch": 44}
46
+ {"train_loss": 5.261200395610025, "train_lr": 0.0019269918483529214, "train_wd": 0.06004928344481208, "epoch": 45}
47
+ {"train_loss": 5.267244089802773, "train_lr": 0.0019228754724891616, "train_wd": 0.060922560924929446, "epoch": 46}
48
+ {"train_loss": 5.273745071282871, "train_lr": 0.0019186508517741035, "train_wd": 0.061813283038881124, "epoch": 47}
49
+ {"train_loss": 5.281555250799246, "train_lr": 0.0019143184819857208, "train_wd": 0.06272135210895002, "epoch": 48}
50
+ {"train_loss": 5.284689280793344, "train_lr": 0.0019098788715468042, "train_wd": 0.06364666855512914, "epoch": 49}
51
+ {"train_loss": 5.290297240947933, "train_lr": 0.0019053325414653385, "train_wd": 0.06458913090604337, "epoch": 50}
52
+ {"train_loss": 5.296585520132363, "train_lr": 0.0019006800252733048, "train_wd": 0.06554863581007495, "epoch": 51}
53
+ {"train_loss": 5.30230634427852, "train_lr": 0.0018959218689641123, "train_wd": 0.06652507804669865, "epoch": 52}
54
+ {"train_loss": 5.303765681721895, "train_lr": 0.0018910586309284967, "train_wd": 0.0675183505380198, "epoch": 53}
55
+ {"train_loss": 5.305392554862132, "train_lr": 0.0018860908818890158, "train_wd": 0.06852834436051636, "epoch": 54}
56
+ {"train_loss": 5.30649539551956, "train_lr": 0.0018810192048330206, "train_wd": 0.06955494875698406, "epoch": 55}
57
+ {"train_loss": 5.307509671464908, "train_lr": 0.001875844194944322, "train_wd": 0.07059805114868235, "epoch": 56}
58
+ {"train_loss": 5.307696122512352, "train_lr": 0.0018705664595332699, "train_wd": 0.07165753714767913, "epoch": 57}
59
+ {"train_loss": 5.307701090566641, "train_lr": 0.0018651866179655167, "train_wd": 0.07273329056939522, "epoch": 58}
60
+ {"train_loss": 5.306215801684976, "train_lr": 0.0018597053015893122, "train_wd": 0.07382519344534542, "epoch": 59}
61
+ {"train_loss": 5.300901007237766, "train_lr": 0.0018541231536614517, "train_wd": 0.07493312603607465, "epoch": 60}
62
+ {"train_loss": 5.300911074586147, "train_lr": 0.001848440829271734, "train_wd": 0.0760569668442891, "epoch": 61}
63
+ {"train_loss": 5.295829151460021, "train_lr": 0.001842658995266125, "train_wd": 0.07719659262817957, "epoch": 62}
64
+ {"train_loss": 5.296168923306523, "train_lr": 0.00183677833016848, "train_wd": 0.07835187841493665, "epoch": 63}
65
+ {"train_loss": 5.294507924315455, "train_lr": 0.0018307995241009147, "train_wd": 0.07952269751445465, "epoch": 64}
66
+ {"train_loss": 5.29376330445234, "train_lr": 0.001824723278702842, "train_wd": 0.08070892153322547, "epoch": 65}
67
+ {"train_loss": 5.292828523116908, "train_lr": 0.0018185503070485885, "train_wd": 0.081910420388418, "epoch": 66}
68
+ {"train_loss": 5.293003456031295, "train_lr": 0.0018122813335637626, "train_wd": 0.08312706232214329, "epoch": 67}
69
+ {"train_loss": 5.289439716523023, "train_lr": 0.0018059170939401807, "train_wd": 0.08435871391590259, "epoch": 68}
70
+ {"train_loss": 5.28995148774436, "train_lr": 0.0017994583350495893, "train_wd": 0.08560524010521922, "epoch": 69}
71
+ {"train_loss": 5.291336945230536, "train_lr": 0.0017929058148559815, "train_wd": 0.0868665041944498, "epoch": 70}
72
+ {"train_loss": 5.29063029674222, "train_lr": 0.0017862603023266462, "train_wd": 0.08814236787177346, "epoch": 71}
73
+ {"train_loss": 5.295422261758007, "train_lr": 0.0017795225773419537, "train_wd": 0.08943269122436058, "epoch": 72}
74
+ {"train_loss": 5.292081625198574, "train_lr": 0.0017726934306037977, "train_wd": 0.09073733275371443, "epoch": 73}
75
+ {"train_loss": 5.2921777883593695, "train_lr": 0.001765773663542838, "train_wd": 0.0920561493911902, "epoch": 74}
76
+ {"train_loss": 5.295905660930202, "train_lr": 0.001758764088224405, "train_wd": 0.09338899651368121, "epoch": 75}
77
+ {"train_loss": 5.295705769297411, "train_lr": 0.00175166552725325, "train_wd": 0.09473572795948056, "epoch": 76}
78
+ {"train_loss": 5.296104822394183, "train_lr": 0.0017444788136769661, "train_wd": 0.09609619604430945, "epoch": 77}
79
+ {"train_loss": 5.2982317376956285, "train_lr": 0.0017372047908882683, "train_wd": 0.09747025157751095, "epoch": 78}
80
+ {"train_loss": 5.300806172078938, "train_lr": 0.0017298443125259803, "train_wd": 0.09885774387841192, "epoch": 79}
81
+ {"train_loss": 5.301281621011136, "train_lr": 0.0017223982423748654, "train_wd": 0.10025852079284558, "epoch": 80}
82
+ {"train_loss": 5.301094462188313, "train_lr": 0.0017148674542642765, "train_wd": 0.10167242870983802, "epoch": 81}
83
+ {"train_loss": 5.3047993360139385, "train_lr": 0.0017072528319655872, "train_wd": 0.10309931257845319, "epoch": 82}
84
+ {"train_loss": 5.318680637722298, "train_lr": 0.0016995552690884806, "train_wd": 0.10453901592479503, "epoch": 83}
85
+ {"train_loss": 5.305510156065059, "train_lr": 0.0016917756689760982, "train_wd": 0.1059913808691678, "epoch": 84}
86
+ {"train_loss": 5.307846314663128, "train_lr": 0.0016839149445989994, "train_wd": 0.10745624814338853, "epoch": 85}
87
+ {"train_loss": 5.309804617977448, "train_lr": 0.0016759740184480443, "train_wd": 0.10893345710825322, "epoch": 86}
88
+ {"train_loss": 5.310509918524112, "train_lr": 0.0016679538224261272, "train_wd": 0.11042284577115233, "epoch": 87}
89
+ {"train_loss": 5.312336324216079, "train_lr": 0.0016598552977388093, "train_wd": 0.1119242508038345, "epoch": 88}
90
+ {"train_loss": 5.3098682396465255, "train_lr": 0.0016516793947838632, "train_wd": 0.11343750756031944, "epoch": 89}
91
+ {"train_loss": 5.312544189054045, "train_lr": 0.0016434270730397637, "train_wd": 0.11496245009495011, "epoch": 90}
92
+ {"train_loss": 5.315520610073678, "train_lr": 0.0016350993009530462, "train_wd": 0.11649891118059391, "epoch": 91}
93
+ {"train_loss": 5.316452932920006, "train_lr": 0.0016266970558246976, "train_wd": 0.11804672232697795, "epoch": 92}
94
+ {"train_loss": 5.316919739297826, "train_lr": 0.001618221323695426, "train_wd": 0.11960571379916764, "epoch": 93}
95
+ {"train_loss": 5.318144990886144, "train_lr": 0.0016096730992299843, "train_wd": 0.12117571463618018, "epoch": 94}
96
+ {"train_loss": 5.320191324638615, "train_lr": 0.0016010533856004134, "train_wd": 0.12275655266973115, "epoch": 95}
97
+ {"train_loss": 5.321631331237958, "train_lr": 0.0015923631943683242, "train_wd": 0.1243480545431163, "epoch": 96}
98
+ {"train_loss": 5.323321582768842, "train_lr": 0.001583603545366187, "train_wd": 0.12595004573021978, "epoch": 97}
99
+ {"train_loss": 5.32424541817104, "train_lr": 0.0015747754665776546, "train_wd": 0.12756235055465595, "epoch": 98}
100
+ {"train_loss": 5.32801631533747, "train_lr": 0.0015658799940169088, "train_wd": 0.12918479220903117, "epoch": 99}
101
+ {"train_loss": 5.328453638451657, "train_lr": 0.0015569181716071012, "train_wd": 0.1308171927743354, "epoch": 100}
102
+ {"train_loss": 5.329449989693723, "train_lr": 0.001547891051057821, "train_wd": 0.13245937323945048, "epoch": 101}
103
+ {"train_loss": 5.332335817704289, "train_lr": 0.001538799691741689, "train_wd": 0.13411115352078318, "epoch": 102}
104
+ {"train_loss": 5.334359170245134, "train_lr": 0.0015296451605700371, "train_wd": 0.1357723524820118, "epoch": 103}
105
+ {"train_loss": 5.33590655573171, "train_lr": 0.0015204285318676787, "train_wd": 0.13744278795395, "epoch": 104}
106
+ {"train_loss": 5.33658836845109, "train_lr": 0.0015111508872468603, "train_wd": 0.13912227675452407, "epoch": 105}
107
+ {"train_loss": 5.338837469772374, "train_lr": 0.0015018133154803177, "train_wd": 0.1408106347088607, "epoch": 106}
108
+ {"train_loss": 5.3418797508513425, "train_lr": 0.0014924169123734913, "train_wd": 0.14250767666948544, "epoch": 107}
109
+ {"train_loss": 5.344305904077397, "train_lr": 0.0014829627806359437, "train_wd": 0.1442132165366222, "epoch": 108}
110
+ {"train_loss": 5.343373100081984, "train_lr": 0.0014734520297519642, "train_wd": 0.1459270672786049, "epoch": 109}
111
+ {"train_loss": 5.3468826347641905, "train_lr": 0.0014638857758503276, "train_wd": 0.14764904095238682, "epoch": 110}
112
+ {"train_loss": 5.346389308226385, "train_lr": 0.0014542651415733513, "train_wd": 0.14937894872414936, "epoch": 111}
113
+ {"train_loss": 5.346873555704653, "train_lr": 0.0014445912559451185, "train_wd": 0.15111660089001122, "epoch": 112}
114
+ {"train_loss": 5.3459897055852705, "train_lr": 0.0014348652542389949, "train_wd": 0.1528618068968313, "epoch": 113}
115
+ {"train_loss": 5.346510966976198, "train_lr": 0.0014250882778444123, "train_wd": 0.15461437536310293, "epoch": 114}
116
+ {"train_loss": 5.347325504135838, "train_lr": 0.0014152614741328984, "train_wd": 0.1563741140999457, "epoch": 115}
117
+ {"train_loss": 5.349009832484926, "train_lr": 0.0014053859963234353, "train_wd": 0.1581408301321759, "epoch": 116}
118
+ {"train_loss": 5.3514899236978675, "train_lr": 0.00139546300334713, "train_wd": 0.1599143297194714, "epoch": 117}
119
+ {"train_loss": 5.351641595149212, "train_lr": 0.0013854936597112062, "train_wd": 0.16169441837761694, "epoch": 118}
120
+ {"train_loss": 5.3536441161049355, "train_lr": 0.0013754791353623405, "train_wd": 0.16348090089983194, "epoch": 119}
121
+ {"train_loss": 5.353606934694173, "train_lr": 0.0013654206055493682, "train_wd": 0.1652735813781757, "epoch": 120}
122
+ {"train_loss": 5.354507647639365, "train_lr": 0.0013553192506853583, "train_wd": 0.16707226322503174, "epoch": 121}
123
+ {"train_loss": 5.355904163192693, "train_lr": 0.0013451762562090913, "train_wd": 0.1688767491946666, "epoch": 122}
124
+ {"train_loss": 5.354328019751443, "train_lr": 0.0013349928124459425, "train_wd": 0.17068684140485862, "epoch": 123}
125
+ {"train_loss": 5.3554320165055165, "train_lr": 0.0013247701144681887, "train_wd": 0.17250234135860018, "epoch": 124}
126
+ {"train_loss": 5.355305136727105, "train_lr": 0.0013145093619547589, "train_wd": 0.1743230499658613, "epoch": 125}
127
+ {"train_loss": 5.355684284659789, "train_lr": 0.0013042117590504607, "train_wd": 0.17614876756542594, "epoch": 126}
128
+ {"train_loss": 5.355934019497544, "train_lr": 0.0012938785142246451, "train_wd": 0.17797929394678566, "epoch": 127}
129
+ {"train_loss": 5.356933341442729, "train_lr": 0.0012835108401294151, "train_wd": 0.1798144283720939, "epoch": 128}
130
+ {"train_loss": 5.356398239934283, "train_lr": 0.0012731099534572874, "train_wd": 0.1816539695981824, "epoch": 129}
131
+ {"train_loss": 5.355753288113719, "train_lr": 0.0012626770747984337, "train_wd": 0.1834977158986244, "epoch": 130}
132
+ {"train_loss": 5.355908048524559, "train_lr": 0.0012522134284974138, "train_wd": 0.18534546508586172, "epoch": 131}
133
+ {"train_loss": 5.356991463094402, "train_lr": 0.0012417202425095224, "train_wd": 0.18719701453337284, "epoch": 132}
134
+ {"train_loss": 5.355122434149544, "train_lr": 0.001231198748256656, "train_wd": 0.18905216119789686, "epoch": 133}
135
+ {"train_loss": 5.355967886751886, "train_lr": 0.0012206501804828127, "train_wd": 0.19091070164169655, "epoch": 134}
136
+ {"train_loss": 5.357231252961498, "train_lr": 0.001210075777109198, "train_wd": 0.19277243205486666, "epoch": 135}
137
+ {"train_loss": 5.3566089267496295, "train_lr": 0.0011994767790889276, "train_wd": 0.19463714827768913, "epoch": 136}
138
+ {"train_loss": 5.357098487212504, "train_lr": 0.0011888544302614131, "train_wd": 0.19650464582301674, "epoch": 137}
139
+ {"train_loss": 5.356014641807329, "train_lr": 0.0011782099772063817, "train_wd": 0.19837471989869845, "epoch": 138}
140
+ {"train_loss": 5.356016622935172, "train_lr": 0.0011675446690976045, "train_wd": 0.20024716543003776, "epoch": 139}
141
+ {"train_loss": 5.357441375271784, "train_lr": 0.0011568597575562672, "train_wd": 0.20212177708228213, "epoch": 140}
142
+ {"train_loss": 5.357439700100157, "train_lr": 0.001146156496504119, "train_wd": 0.20399834928313787, "epoch": 141}
143
+ {"train_loss": 5.357387976966602, "train_lr": 0.0011354361420162988, "train_wd": 0.20587667624531794, "epoch": 142}
144
+ {"train_loss": 5.3559060115560735, "train_lr": 0.001124699952173936, "train_wd": 0.20775655198910256, "epoch": 143}
145
+ {"train_loss": 5.354808613121938, "train_lr": 0.0011139491869165093, "train_wd": 0.20963777036493306, "epoch": 144}
146
+ {"train_loss": 5.351922285833138, "train_lr": 0.0011031851078939937, "train_wd": 0.21152012507601464, "epoch": 145}
147
+ {"train_loss": 5.35377579277082, "train_lr": 0.0010924089783187806, "train_wd": 0.2134034097009406, "epoch": 146}
148
+ {"train_loss": 5.351995900976096, "train_lr": 0.0010816220628174608, "train_wd": 0.21528741771633014, "epoch": 147}
149
+ {"train_loss": 5.350265190660429, "train_lr": 0.001070825627282391, "train_wd": 0.217171942519473, "epoch": 148}
150
+ {"train_loss": 5.349177232510942, "train_lr": 0.0010600209387231492, "train_wd": 0.21905677745098834, "epoch": 149}
151
+ {"train_loss": 5.3485994441665525, "train_lr": 0.0010492092651178493, "train_wd": 0.22094171581748476, "epoch": 150}
152
+ {"train_loss": 5.3443039077982535, "train_lr": 0.0010383918752643211, "train_wd": 0.22282655091422968, "epoch": 151}
153
+ {"train_loss": 5.3429892399042345, "train_lr": 0.0010275700386312263, "train_wd": 0.22471107604781423, "epoch": 152}
154
+ {"train_loss": 5.341276060500972, "train_lr": 0.0010167450252090754, "train_wd": 0.22659508455882188, "epoch": 153}
155
+ {"train_loss": 5.339956222320918, "train_lr": 0.0010059181053611898, "train_wd": 0.22847836984448705, "epoch": 154}
156
+ {"train_loss": 5.338739819878297, "train_lr": 0.0009950905496746184, "train_wd": 0.23036072538135743, "epoch": 155}
157
+ {"train_loss": 5.33691573617079, "train_lr": 0.0009842636288110262, "train_wd": 0.2322419447479335, "epoch": 156}
158
+ {"train_loss": 5.333186289937281, "train_lr": 0.0009734386133575811, "train_wd": 0.23412182164731465, "epoch": 157}
159
+ {"train_loss": 5.332632420755786, "train_lr": 0.0009626167736778422, "train_wd": 0.2360001499298133, "epoch": 158}
160
+ {"train_loss": 5.331472542312601, "train_lr": 0.0009517993797626801, "train_wd": 0.23787672361556705, "epoch": 159}
161
+ {"train_loss": 5.327957806255606, "train_lr": 0.0009409877010812298, "train_wd": 0.23975133691712414, "epoch": 160}
162
+ {"train_loss": 5.326287980702856, "train_lr": 0.0009301830064319187, "train_wd": 0.24162378426201056, "epoch": 161}
163
+ {"train_loss": 5.323021064106699, "train_lr": 0.0009193865637935735, "train_wd": 0.2434938603152749, "epoch": 162}
164
+ {"train_loss": 5.322141060535666, "train_lr": 0.0009085996401766097, "train_wd": 0.24536136000200406, "epoch": 163}
165
+ {"train_loss": 5.319853870417003, "train_lr": 0.0008978235014743327, "train_wd": 0.24722607852981315, "epoch": 164}
166
+ {"train_loss": 5.316981103327825, "train_lr": 0.0008870594123144038, "train_wd": 0.2490878114112999, "epoch": 165}
167
+ {"train_loss": 5.315526246071624, "train_lr": 0.0008763086359104094, "train_wd": 0.2509463544864762, "epoch": 166}
168
+ {"train_loss": 5.312530470504273, "train_lr": 0.0008655724339136243, "train_wd": 0.2528015039451491, "epoch": 167}
169
+ {"train_loss": 5.308834480033886, "train_lr": 0.0008548520662649607, "train_wd": 0.254653056349276, "epoch": 168}
170
+ {"train_loss": 5.30545787376275, "train_lr": 0.0008441487910470901, "train_wd": 0.2565008086552697, "epoch": 169}
171
+ {"train_loss": 5.302127437959377, "train_lr": 0.0008334638643368153, "train_wd": 0.2583445582362668, "epoch": 170}
172
+ {"train_loss": 5.299457348936754, "train_lr": 0.000822798540057662, "train_wd": 0.2601841029043497, "epoch": 171}
173
+ {"train_loss": 5.297182236072257, "train_lr": 0.0008121540698327205, "train_wd": 0.26201924093271484, "epoch": 172}
174
+ {"train_loss": 5.292786442547393, "train_lr": 0.0008015317028377698, "train_wd": 0.2638497710777995, "epoch": 173}
175
+ {"train_loss": 5.2893898485423465, "train_lr": 0.0007909326856546683, "train_wd": 0.2656754926013423, "epoch": 174}
176
+ {"train_loss": 5.286020152526889, "train_lr": 0.0007803582621250795, "train_wd": 0.26749620529240564, "epoch": 175}
177
+ {"train_loss": 5.28303490866193, "train_lr": 0.0007698096732044905, "train_wd": 0.2693117094893247, "epoch": 176}
178
+ {"train_loss": 5.280938950493086, "train_lr": 0.0007592881568165811, "train_wd": 0.27112180610160586, "epoch": 177}
179
+ {"train_loss": 5.277171620600325, "train_lr": 0.0007487949477079449, "train_wd": 0.27292629663175794, "epoch": 178}
180
+ {"train_loss": 5.273054663988231, "train_lr": 0.0007383312773031978, "train_wd": 0.2747249831970586, "epoch": 179}
181
+ {"train_loss": 5.270321273713185, "train_lr": 0.00072789837356046, "train_wd": 0.2765176685512585, "epoch": 180}
182
+ {"train_loss": 5.265006804613949, "train_lr": 0.000717497460827235, "train_wd": 0.27830415610620435, "epoch": 181}
183
+ {"train_loss": 5.26118450056163, "train_lr": 0.0007071297596967538, "train_wd": 0.2800842499534056, "epoch": 182}
184
+ {"train_loss": 5.258430524862451, "train_lr": 0.0006967964868647077, "train_wd": 0.2818577548855112, "epoch": 183}
185
+ {"train_loss": 5.254658599503988, "train_lr": 0.0006864988549864827, "train_wd": 0.2836244764177193, "epoch": 184}
186
+ {"train_loss": 5.250112573377234, "train_lr": 0.0006762380725348328, "train_wd": 0.2853842208091065, "epoch": 185}
187
+ {"train_loss": 5.246409534312171, "train_lr": 0.0006660153436580767, "train_wd": 0.2871367950838696, "epoch": 186}
188
+ {"train_loss": 5.240689671225399, "train_lr": 0.0006558318680387706, "train_wd": 0.2888820070524873, "epoch": 187}
189
+ {"train_loss": 5.235934831875024, "train_lr": 0.0006456888407529291, "train_wd": 0.29061966533280315, "epoch": 188}
190
+ {"train_loss": 5.232231075600755, "train_lr": 0.0006355874521297811, "train_wd": 0.2923495793710027, "epoch": 189}
191
+ {"train_loss": 5.2296532516142165, "train_lr": 0.0006255288876120631, "train_wd": 0.2940715594625201, "epoch": 190}
192
+ {"train_loss": 5.224616110038986, "train_lr": 0.0006155143276169212, "train_wd": 0.29578541677283016, "epoch": 191}
193
+ {"train_loss": 5.221290291618291, "train_lr": 0.0006055449473973712, "train_wd": 0.2974909633581683, "epoch": 192}
194
+ {"train_loss": 5.2147308859846095, "train_lr": 0.0005956219169043888, "train_wd": 0.2991880121861295, "epoch": 193}
195
+ {"train_loss": 5.210133640695628, "train_lr": 0.0005857464006495933, "train_wd": 0.3008763771561874, "epoch": 194}
196
+ {"train_loss": 5.204653665554418, "train_lr": 0.000575919557568606, "train_wd": 0.3025558731200963, "epoch": 195}
197
+ {"train_loss": 5.198422485475632, "train_lr": 0.0005661425408850318, "train_wd": 0.30422631590219695, "epoch": 196}
198
+ {"train_loss": 5.192577986003493, "train_lr": 0.0005564164979751273, "train_wd": 0.3058875223196151, "epoch": 197}
199
+ {"train_loss": 5.188118070959568, "train_lr": 0.0005467425702331502, "train_wd": 0.3075393102023465, "epoch": 198}
200
+ {"train_loss": 5.184111035151257, "train_lr": 0.000537121892937416, "train_wd": 0.3091814984132353, "epoch": 199}
201
+ {"train_loss": 5.178760282594046, "train_lr": 0.0005275555951170565, "train_wd": 0.31081390686783883, "epoch": 200}
202
+ {"train_loss": 5.175123964639591, "train_lr": 0.0005180447994195406, "train_wd": 0.31243635655417534, "epoch": 201}
203
+ {"train_loss": 5.168212484303329, "train_lr": 0.0005085906219789087, "train_wd": 0.3140486695523516, "epoch": 202}
204
+ {"train_loss": 5.164016685826029, "train_lr": 0.0004991941722848035, "train_wd": 0.31565066905408046, "epoch": 203}
205
+ {"train_loss": 5.158912756055188, "train_lr": 0.0004898565530522569, "train_wd": 0.31724217938206156, "epoch": 204}
206
+ {"train_loss": 5.151946374790655, "train_lr": 0.0004805788600922868, "train_wd": 0.31882302600925444, "epoch": 205}
207
+ {"train_loss": 5.147163253608081, "train_lr": 0.00047136218218329825, "train_wd": 0.32039303557801124, "epoch": 206}
208
+ {"train_loss": 5.139867486332437, "train_lr": 0.0004622076009433072, "train_wd": 0.32195203591908944, "epoch": 207}
209
+ {"train_loss": 5.134232663469826, "train_lr": 0.0004531161907030123, "train_wd": 0.3234998560705342, "epoch": 208}
210
+ {"train_loss": 5.128424988519088, "train_lr": 0.00044408901837971447, "train_wd": 0.32503632629642326, "epoch": 209}
211
+ {"train_loss": 5.1229675430759825, "train_lr": 0.0004351271433521113, "train_wd": 0.3265612781054832, "epoch": 210}
212
+ {"train_loss": 5.1169812633550995, "train_lr": 0.00042623161733597016, "train_wd": 0.3280745442695616, "epoch": 211}
213
+ {"train_loss": 5.109434343141904, "train_lr": 0.00041740348426070993, "train_wd": 0.3295759588419709, "epoch": 212}
214
+ {"train_loss": 5.103250536058161, "train_lr": 0.0004086437801468898, "train_wd": 0.33106535717568547, "epoch": 213}
215
+ {"train_loss": 5.0977142393636665, "train_lr": 0.0003999535329846263, "train_wd": 0.3325425759413923, "epoch": 214}
216
+ {"train_loss": 5.09096563303118, "train_lr": 0.0003913337626129549, "train_wd": 0.33400745314540786, "epoch": 215}
217
+ {"train_loss": 5.084373079305835, "train_lr": 0.0003827854806001447, "train_wd": 0.33545982814743885, "epoch": 216}
218
+ {"train_loss": 5.0776247274484945, "train_lr": 0.0003743096901249942, "train_wd": 0.3368995416781991, "epoch": 217}
219
+ {"train_loss": 5.071427017974434, "train_lr": 0.00036590738585909246, "train_wd": 0.3383264358568765, "epoch": 218}
220
+ {"train_loss": 5.064928268357146, "train_lr": 0.00035757955385010083, "train_wd": 0.33974035420844456, "epoch": 219}
221
+ {"train_loss": 5.057662455369528, "train_lr": 0.0003493271714060281, "train_wd": 0.3411411416808224, "epoch": 220}
222
+ {"train_loss": 5.052747223302901, "train_lr": 0.00034115120698054413, "train_wd": 0.3425286446618775, "epoch": 221}
223
+ {"train_loss": 5.045558305262185, "train_lr": 0.0003330526200593252, "train_wd": 0.3439027109962745, "epoch": 222}
224
+ {"train_loss": 5.038101597036198, "train_lr": 0.00032503236104745094, "train_wd": 0.34526319000215344, "epoch": 223}
225
+ {"train_loss": 5.030003580138933, "train_lr": 0.0003170913711578803, "train_wd": 0.34660993248766137, "epoch": 224}
226
+ {"train_loss": 5.023696114143117, "train_lr": 0.00030923058230098257, "train_wd": 0.34794279076730644, "epoch": 225}
227
+ {"train_loss": 5.0165140662881305, "train_lr": 0.0003014509169751841, "train_wd": 0.34926161867816086, "epoch": 226}
228
+ {"train_loss": 5.009698191849734, "train_lr": 0.0002937532881587045, "train_wd": 0.35056627159588083, "epoch": 227}
229
+ {"train_loss": 5.00137701840233, "train_lr": 0.0002861385992024148, "train_wd": 0.351856606450572, "epoch": 228}
230
+ {"train_loss": 4.994674074945213, "train_lr": 0.0002786077437238243, "train_wd": 0.353132481742477, "epoch": 229}
231
+ {"train_loss": 4.98764476906672, "train_lr": 0.00027116160550221506, "train_wd": 0.3543937575574922, "epoch": 230}
232
+ {"train_loss": 4.979976188602874, "train_lr": 0.00026380105837492217, "train_wd": 0.3556402955825113, "epoch": 231}
233
+ {"train_loss": 4.9719487094431285, "train_lr": 0.00025652696613478554, "train_wd": 0.3568719591205926, "epoch": 232}
234
+ {"train_loss": 4.9644304828154, "train_lr": 0.0002493401824287798, "train_wd": 0.3580886131059502, "epoch": 233}
235
+ {"train_loss": 4.956700345833334, "train_lr": 0.0002422415506578395, "train_wd": 0.35929012411876265, "epoch": 234}
236
+ {"train_loss": 4.948297347382104, "train_lr": 0.00023523190387787592, "train_wd": 0.36047636039980857, "epoch": 235}
237
+ {"train_loss": 4.9424779818450615, "train_lr": 0.00022831206470201763, "train_wd": 0.3616471918649123, "epoch": 236}
238
+ {"train_loss": 4.9327193981737825, "train_lr": 0.00022148284520407375, "train_wd": 0.3628024901192085, "epoch": 237}
239
+ {"train_loss": 4.92455313107569, "train_lr": 0.0002147450468232303, "train_wd": 0.36394212847122615, "epoch": 238}
240
+ {"train_loss": 4.917870346709884, "train_lr": 0.00020809946027000196, "train_wd": 0.36506598194677603, "epoch": 239}
241
+ {"train_loss": 4.907198251889859, "train_lr": 0.00020154686543343578, "train_wd": 0.3661739273026614, "epoch": 240}
242
+ {"train_loss": 4.900665078469984, "train_lr": 0.0001950880312895884, "train_wd": 0.3672658430401871, "epoch": 241}
243
+ {"train_loss": 4.89050177737868, "train_lr": 0.0001887237158112833, "train_wd": 0.3683416094184872, "epoch": 242}
244
+ {"train_loss": 4.882661578514212, "train_lr": 0.00018245466587916038, "train_wd": 0.3694011084676571, "epoch": 243}
245
+ {"train_loss": 4.873007433615523, "train_lr": 0.0001762816171940242, "train_wd": 0.3704442240016874, "epoch": 244}
246
+ {"train_loss": 4.863366123488386, "train_lr": 0.00017020529419050807, "train_wd": 0.3714708416312026, "epoch": 245}
247
+ {"train_loss": 4.855247921151794, "train_lr": 0.000164226409952058, "train_wd": 0.37248084877601123, "epoch": 246}
248
+ {"train_loss": 4.845685126350747, "train_lr": 0.00015834566612724755, "train_wd": 0.37347413467744817, "epoch": 247}
249
+ {"train_loss": 4.837190835119532, "train_lr": 0.0001525637528474392, "train_wd": 0.3744505904105231, "epoch": 248}
250
+ {"train_loss": 4.826414683811384, "train_lr": 0.000146881348645791, "train_wd": 0.37541010889585846, "epoch": 249}
251
+ {"train_loss": 4.816837973660417, "train_lr": 0.00014129912037763172, "train_wd": 0.37635258491144113, "epoch": 250}
252
+ {"train_loss": 4.806832356120852, "train_lr": 0.00013581772314219805, "train_wd": 0.37727791510415504, "epoch": 251}
253
+ {"train_loss": 4.797565344188044, "train_lr": 0.00013043780020575952, "train_wd": 0.3781859980011157, "epoch": 252}
254
+ {"train_loss": 4.787975496739793, "train_lr": 0.0001251599829261254, "train_wd": 0.37907673402080266, "epoch": 253}
255
+ {"train_loss": 4.778846158803129, "train_lr": 0.00011998489067855475, "train_wd": 0.37995002548397105, "epoch": 254}
256
+ {"train_loss": 4.769147366928539, "train_lr": 0.0001149131307830678, "train_wd": 0.3808057766243729, "epoch": 255}
257
+ {"train_loss": 4.758902791521246, "train_lr": 0.00010994529843317512, "train_wd": 0.3816438935992515, "epoch": 256}
258
+ {"train_loss": 4.74997969794807, "train_lr": 0.00010508197662602924, "train_wd": 0.3824642844996354, "epoch": 257}
259
+ {"train_loss": 4.74077859154041, "train_lr": 0.00010032373609400729, "train_wd": 0.38326685936041804, "epoch": 258}
260
+ {"train_loss": 4.731040912959501, "train_lr": 9.56711352377327e-05, "train_wd": 0.38405153017022187, "epoch": 259}
261
+ {"train_loss": 4.7222571982015715, "train_lr": 9.112472006054422e-05, "train_wd": 0.38481821088104945, "epoch": 260}
262
+ {"train_loss": 4.712104947327806, "train_lr": 8.668502410442095e-05, "train_wd": 0.3855668174177217, "epoch": 261}
263
+ {"train_loss": 4.702808143626109, "train_lr": 8.235256838736765e-05, "train_wd": 0.3862972676870952, "epoch": 262}
264
+ {"train_loss": 4.693713557531984, "train_lr": 7.812786134227221e-05, "train_wd": 0.3870094815870675, "epoch": 263}
265
+ {"train_loss": 4.682229380229775, "train_lr": 7.401139875723767e-05, "train_wd": 0.3877033810153572, "epoch": 264}
266
+ {"train_loss": 4.6731468029826475, "train_lr": 7.000366371739977e-05, "train_wd": 0.38837888987807484, "epoch": 265}
267
+ {"train_loss": 4.664330259668265, "train_lr": 6.610512654823477e-05, "train_wd": 0.38903593409805837, "epoch": 266}
268
+ {"train_loss": 4.656385099740146, "train_lr": 6.231624476036483e-05, "train_wd": 0.3896744416230066, "epoch": 267}
269
+ {"train_loss": 4.646662142279623, "train_lr": 5.8637462995866595e-05, "train_wd": 0.39029434243337324, "epoch": 268}
270
+ {"train_loss": 4.637298107016192, "train_lr": 5.5069212976091174e-05, "train_wd": 0.3908955685500501, "epoch": 269}
271
+ {"train_loss": 4.625819423275409, "train_lr": 5.161191345099935e-05, "train_wd": 0.39147805404181696, "epoch": 270}
272
+ {"train_loss": 4.61837213762182, "train_lr": 4.826597015001902e-05, "train_wd": 0.3920417350325767, "epoch": 271}
273
+ {"train_loss": 4.6093446456437865, "train_lr": 4.5031775734431806e-05, "train_wd": 0.39258654970835427, "epoch": 272}
274
+ {"train_loss": 4.600542716282925, "train_lr": 4.190970975129205e-05, "train_wd": 0.39311243832408505, "epoch": 273}
275
+ {"train_loss": 4.5911011797227825, "train_lr": 3.890013858888553e-05, "train_wd": 0.3936193432101521, "epoch": 274}
276
+ {"train_loss": 4.583430806271655, "train_lr": 3.6003415433731646e-05, "train_wd": 0.3941072087787241, "epoch": 275}
277
+ {"train_loss": 4.57514800880548, "train_lr": 3.321988022913639e-05, "train_wd": 0.39457598152984424, "epoch": 276}
278
+ {"train_loss": 4.566035068923716, "train_lr": 3.054985963529725e-05, "train_wd": 0.39502561005729664, "epoch": 277}
279
+ {"train_loss": 4.5569964723406935, "train_lr": 2.799366699096945e-05, "train_wd": 0.39545604505424736, "epoch": 278}
280
+ {"train_loss": 4.549356738309399, "train_lr": 2.555160227669323e-05, "train_wd": 0.3958672393186477, "epoch": 279}
281
+ {"train_loss": 4.542794259129573, "train_lr": 2.322395207959048e-05, "train_wd": 0.39625914775841237, "epoch": 280}
282
+ {"train_loss": 4.53448782769515, "train_lr": 2.1010989559732036e-05, "train_wd": 0.3966317273963664, "epoch": 281}
283
+ {"train_loss": 4.528655390981004, "train_lr": 1.891297441808141e-05, "train_wd": 0.3969849373749528, "epoch": 282}
284
+ {"train_loss": 4.522289742501996, "train_lr": 1.6930152866017515e-05, "train_wd": 0.3973187389607159, "epoch": 283}
285
+ {"train_loss": 4.514690550837776, "train_lr": 1.5062757596440936e-05, "train_wd": 0.39763309554855275, "epoch": 284}
286
+ {"train_loss": 4.508909112984519, "train_lr": 1.3311007756466215e-05, "train_wd": 0.39792797266571783, "epoch": 285}
287
+ {"train_loss": 4.502513048364866, "train_lr": 1.1675108921703887e-05, "train_wd": 0.3982033379756162, "epoch": 286}
288
+ {"train_loss": 4.497596346419588, "train_lr": 1.0155253072135383e-05, "train_wd": 0.3984591612813356, "epoch": 287}
289
+ {"train_loss": 4.493581289403158, "train_lr": 8.7516185695834e-06, "train_wd": 0.39869541452896834, "epoch": 288}
290
+ {"train_loss": 4.488790155588675, "train_lr": 7.464370136780158e-06, "train_wd": 0.39891207181068383, "epoch": 289}
291
+ {"train_loss": 4.484065244869172, "train_lr": 6.293658838036681e-06, "train_wd": 0.39910910936756855, "epoch": 290}
292
+ {"train_loss": 4.480979661623255, "train_lr": 5.2396220615144845e-06, "train_wd": 0.39928650559223694, "epoch": 291}
293
+ {"train_loss": 4.476422199170938, "train_lr": 4.302383503102697e-06, "train_wd": 0.3994442410311896, "epoch": 292}
294
+ {"train_loss": 4.473310585704734, "train_lr": 3.482053151901624e-06, "train_wd": 0.399582298386962, "epoch": 293}
295
+ {"train_loss": 4.471176154726892, "train_lr": 2.778727277315148e-06, "train_wd": 0.3997006625200075, "epoch": 294}
296
+ {"train_loss": 4.468422725570383, "train_lr": 2.192488417753049e-06, "train_wd": 0.399799320450365, "epoch": 295}
297
+ {"train_loss": 4.468255913836493, "train_lr": 1.7234053709447294e-06, "train_wd": 0.39987826135908094, "epoch": 296}
298
+ {"train_loss": 4.465327120572924, "train_lr": 1.3715331858655515e-06, "train_wd": 0.3999374765893954, "epoch": 297}
299
+ {"train_loss": 4.4642800721976394, "train_lr": 1.136913156276552e-06, "train_wd": 0.3999769596476907, "epoch": 298}
300
+ {"train_loss": 4.464623126456682, "train_lr": 1.0195728158784548e-06, "train_wd": 0.39999670620420386, "epoch": 299}
Vim/Tiny/log_eval.txt ADDED
@@ -0,0 +1,100 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"train_lr": 0.0019999999999998686, "train_loss": 1.9394195398127514, "epoch": 0, "test_loss": 1.3299601733913202, "test_acc1": 67.352, "test_acc5": 88.246}
2
+ {"train_lr": 0.0019995065603657376, "train_loss": 1.4895059365750882, "epoch": 1, "test_loss": 1.2500209893716876, "test_acc1": 69.202, "test_acc5": 89.39}
3
+ {"train_lr": 0.0019980267284282105, "train_loss": 1.4050731192492887, "epoch": 2, "test_loss": 1.2093816739900032, "test_acc1": 70.214, "test_acc5": 89.722}
4
+ {"train_lr": 0.001995561964603092, "train_loss": 1.3557268998597176, "epoch": 3, "test_loss": 1.1917529543647376, "test_acc1": 70.428, "test_acc5": 89.984}
5
+ {"train_lr": 0.0019921147013145773, "train_loss": 1.3201949973845548, "epoch": 4, "test_loss": 1.1704205622148636, "test_acc1": 70.988, "test_acc5": 90.272}
6
+ {"train_lr": 0.0019876883405950175, "train_loss": 1.2950622001458205, "epoch": 5, "test_loss": 1.1628179901929767, "test_acc1": 70.964, "test_acc5": 90.498}
7
+ {"train_lr": 0.0019822872507288198, "train_loss": 1.2788213456136628, "epoch": 6, "test_loss": 1.1616404151062831, "test_acc1": 71.326, "test_acc5": 90.298}
8
+ {"train_lr": 0.0019759167619387524, "train_loss": 1.2601114897562702, "epoch": 7, "test_loss": 1.1566813130817755, "test_acc1": 71.296, "test_acc5": 90.344}
9
+ {"train_lr": 0.001968583161128624, "train_loss": 1.2457857671209778, "epoch": 8, "test_loss": 1.1448852566578198, "test_acc1": 71.712, "test_acc5": 90.534}
10
+ {"train_lr": 0.001960293685677003, "train_loss": 1.234269193754261, "epoch": 9, "test_loss": 1.1460910282095376, "test_acc1": 71.392, "test_acc5": 90.59}
11
+ {"train_lr": 0.0019510565162951365, "train_loss": 1.224008701631559, "epoch": 10, "test_loss": 1.1481351356219758, "test_acc1": 71.516, "test_acc5": 90.494}
12
+ {"train_lr": 0.0019408807689541316, "train_loss": 1.2149226944171758, "epoch": 11, "test_loss": 1.1432129745669377, "test_acc1": 71.594, "test_acc5": 90.594}
13
+ {"train_lr": 0.0019297764858882515, "train_loss": 1.2047593642712306, "epoch": 12, "test_loss": 1.1257584109864271, "test_acc1": 71.966, "test_acc5": 90.71}
14
+ {"train_lr": 0.0019177546256839834, "train_loss": 1.1984074112657448, "epoch": 13, "test_loss": 1.1318223365127582, "test_acc1": 71.786, "test_acc5": 90.774}
15
+ {"train_lr": 0.0019048270524661083, "train_loss": 1.1934852913004181, "epoch": 14, "test_loss": 1.1335975052526845, "test_acc1": 71.832, "test_acc5": 90.742}
16
+ {"train_lr": 0.0018910065241883177, "train_loss": 1.1838929758481964, "epoch": 15, "test_loss": 1.1268517046861941, "test_acc1": 72.07, "test_acc5": 90.796}
17
+ {"train_lr": 0.0018763066800438779, "train_loss": 1.1790978701184665, "epoch": 16, "test_loss": 1.1284329878628407, "test_acc1": 71.996, "test_acc5": 90.72}
18
+ {"train_lr": 0.0018607420270040137, "train_loss": 1.1743117745904699, "epoch": 17, "test_loss": 1.1267351508140564, "test_acc1": 71.968, "test_acc5": 90.738}
19
+ {"train_lr": 0.001844327925502041, "train_loss": 1.167326608956265, "epoch": 18, "test_loss": 1.1219729225882484, "test_acc1": 72.064, "test_acc5": 90.88}
20
+ {"train_lr": 0.0018270805742745338, "train_loss": 1.1614796393723952, "epoch": 19, "test_loss": 1.122248386254396, "test_acc1": 71.986, "test_acc5": 90.846}
21
+ {"train_lr": 0.0018090169943749148, "train_loss": 1.1579939072316903, "epoch": 20, "test_loss": 1.117832330334217, "test_acc1": 72.244, "test_acc5": 90.91}
22
+ {"train_lr": 0.001790155012375684, "train_loss": 1.1517065800086432, "epoch": 21, "test_loss": 1.1216408789843855, "test_acc1": 72.06, "test_acc5": 90.914}
23
+ {"train_lr": 0.00177051324277586, "train_loss": 1.146630821361858, "epoch": 22, "test_loss": 1.1244902985785015, "test_acc1": 72.196, "test_acc5": 90.788}
24
+ {"train_lr": 0.0017501110696303821, "train_loss": 1.1404163108984566, "epoch": 23, "test_loss": 1.1199206392783339, "test_acc1": 72.124, "test_acc5": 90.8}
25
+ {"train_lr": 0.001728968627421389, "train_loss": 1.1397176145721424, "epoch": 24, "test_loss": 1.1174130469865506, "test_acc1": 72.452, "test_acc5": 90.928}
26
+ {"train_lr": 0.0017071067811865767, "train_loss": 1.1347195509489278, "epoch": 25, "test_loss": 1.1164292820426813, "test_acc1": 72.306, "test_acc5": 90.812}
27
+ {"train_lr": 0.0016845471059286062, "train_loss": 1.1293862803704826, "epoch": 26, "test_loss": 1.116272209893407, "test_acc1": 72.3, "test_acc5": 90.932}
28
+ {"train_lr": 0.001661311865323677, "train_loss": 1.1267507408577777, "epoch": 27, "test_loss": 1.1138558283714992, "test_acc1": 72.472, "test_acc5": 90.986}
29
+ {"train_lr": 0.001637423989748733, "train_loss": 1.1217202165223958, "epoch": 28, "test_loss": 1.1122960829368942, "test_acc1": 72.408, "test_acc5": 91.02}
30
+ {"train_lr": 0.001612907053652909, "train_loss": 1.1191584713283749, "epoch": 29, "test_loss": 1.1097518093598164, "test_acc1": 72.404, "test_acc5": 90.994}
31
+ {"train_lr": 0.0015877852522924111, "train_loss": 1.1161460292801302, "epoch": 30, "test_loss": 1.1123244903429086, "test_acc1": 72.41, "test_acc5": 91.016}
32
+ {"train_lr": 0.0015620833778521046, "train_loss": 1.1115648148122235, "epoch": 31, "test_loss": 1.107154603009029, "test_acc1": 72.594, "test_acc5": 90.986}
33
+ {"train_lr": 0.0015358267949790963, "train_loss": 1.108296306968283, "epoch": 32, "test_loss": 1.1072572523065844, "test_acc1": 72.628, "test_acc5": 90.928}
34
+ {"train_lr": 0.0015090414157503675, "train_loss": 1.1032026825168348, "epoch": 33, "test_loss": 1.103592855279403, "test_acc1": 72.638, "test_acc5": 90.982}
35
+ {"train_lr": 0.0014817536741017646, "train_loss": 1.1019247201707807, "epoch": 34, "test_loss": 1.1021103329975586, "test_acc1": 72.61, "test_acc5": 90.996}
36
+ {"train_lr": 0.001453990499739611, "train_loss": 1.0978659956373313, "epoch": 35, "test_loss": 1.107620112559832, "test_acc1": 72.58, "test_acc5": 90.922}
37
+ {"train_lr": 0.0014257792915651636, "train_loss": 1.0946717398658639, "epoch": 36, "test_loss": 1.1041595811581673, "test_acc1": 72.488, "test_acc5": 91.06}
38
+ {"train_lr": 0.001397147890634744, "train_loss": 1.0919734213145504, "epoch": 37, "test_loss": 1.1012236876484682, "test_acc1": 72.672, "test_acc5": 91.084}
39
+ {"train_lr": 0.001368124552684745, "train_loss": 1.0886381687019713, "epoch": 38, "test_loss": 1.098489917567014, "test_acc1": 72.734, "test_acc5": 91.022}
40
+ {"train_lr": 0.0013387379202453142, "train_loss": 1.0866897209460764, "epoch": 39, "test_loss": 1.098137907169359, "test_acc1": 72.72, "test_acc5": 91.03}
41
+ {"train_lr": 0.0013090169943749093, "train_loss": 1.0830197254753189, "epoch": 40, "test_loss": 1.0984532511828806, "test_acc1": 72.654, "test_acc5": 91.082}
42
+ {"train_lr": 0.0012789911060391633, "train_loss": 1.0805857636918557, "epoch": 41, "test_loss": 1.0907364895810252, "test_acc1": 72.924, "test_acc5": 91.292}
43
+ {"train_lr": 0.0012486898871647862, "train_loss": 1.0789034249386786, "epoch": 42, "test_loss": 1.0983302168681492, "test_acc1": 72.672, "test_acc5": 91.154}
44
+ {"train_lr": 0.001218143241396569, "train_loss": 1.0752621524146067, "epoch": 43, "test_loss": 1.0961631286479627, "test_acc1": 72.736, "test_acc5": 91.198}
45
+ {"train_lr": 0.0011873813145856604, "train_loss": 1.070425175115484, "epoch": 44, "test_loss": 1.0946691412373881, "test_acc1": 72.846, "test_acc5": 91.178}
46
+ {"train_lr": 0.0011564344650402871, "train_loss": 1.0677069343605663, "epoch": 45, "test_loss": 1.092641483334934, "test_acc1": 72.824, "test_acc5": 91.092}
47
+ {"train_lr": 0.0011253332335643327, "train_loss": 1.0661474971403564, "epoch": 46, "test_loss": 1.0894057868462999, "test_acc1": 72.796, "test_acc5": 91.246}
48
+ {"train_lr": 0.001094108313318475, "train_loss": 1.0652352349726237, "epoch": 47, "test_loss": 1.0903175639374483, "test_acc1": 72.904, "test_acc5": 91.226}
49
+ {"train_lr": 0.0010627905195293463, "train_loss": 1.0607659826922122, "epoch": 48, "test_loss": 1.0880373155750582, "test_acc1": 72.872, "test_acc5": 91.198}
50
+ {"train_lr": 0.0010314107590780974, "train_loss": 1.05850977698565, "epoch": 49, "test_loss": 1.0873476263431028, "test_acc1": 72.896, "test_acc5": 91.194}
51
+ {"train_lr": 0.0009999999999999343, "train_loss": 1.0560046185791803, "epoch": 50, "test_loss": 1.085933249053138, "test_acc1": 72.966, "test_acc5": 91.224}
52
+ {"train_lr": 0.0009685892409218651, "train_loss": 1.05410830355374, "epoch": 51, "test_loss": 1.0843035926675553, "test_acc1": 72.998, "test_acc5": 91.182}
53
+ {"train_lr": 0.0009372094804707101, "train_loss": 1.0522097808227413, "epoch": 52, "test_loss": 1.083007411083297, "test_acc1": 73.176, "test_acc5": 91.296}
54
+ {"train_lr": 0.0009058916866814987, "train_loss": 1.0484336283068347, "epoch": 53, "test_loss": 1.0820611955793313, "test_acc1": 73.018, "test_acc5": 91.266}
55
+ {"train_lr": 0.0008746667664356905, "train_loss": 1.045933330762734, "epoch": 54, "test_loss": 1.0865987877902168, "test_acc1": 73.03, "test_acc5": 91.294}
56
+ {"train_lr": 0.0008435655349597399, "train_loss": 1.044268217472091, "epoch": 55, "test_loss": 1.0776301011100144, "test_acc1": 73.194, "test_acc5": 91.286}
57
+ {"train_lr": 0.0008126186854142688, "train_loss": 1.041966896987871, "epoch": 56, "test_loss": 1.076266079988626, "test_acc1": 73.194, "test_acc5": 91.316}
58
+ {"train_lr": 0.0007818567586034925, "train_loss": 1.0412271602411913, "epoch": 57, "test_loss": 1.0766167737486418, "test_acc1": 73.216, "test_acc5": 91.266}
59
+ {"train_lr": 0.0007513101128351359, "train_loss": 1.0351296110994759, "epoch": 58, "test_loss": 1.0760000863534105, "test_acc1": 73.18, "test_acc5": 91.302}
60
+ {"train_lr": 0.000721008893960812, "train_loss": 1.035528433653911, "epoch": 59, "test_loss": 1.0766144641639326, "test_acc1": 73.306, "test_acc5": 91.356}
61
+ {"train_lr": 0.0006909830056250302, "train_loss": 1.0342691602156346, "epoch": 60, "test_loss": 1.0745683335282308, "test_acc1": 73.346, "test_acc5": 91.34}
62
+ {"train_lr": 0.0006612620797547435, "train_loss": 1.0328092442879762, "epoch": 61, "test_loss": 1.073943282560924, "test_acc1": 73.328, "test_acc5": 91.256}
63
+ {"train_lr": 0.0006318754473153419, "train_loss": 1.0284020406719785, "epoch": 62, "test_loss": 1.072020601395451, "test_acc1": 73.3, "test_acc5": 91.346}
64
+ {"train_lr": 0.0006028521093652263, "train_loss": 1.0257388040143587, "epoch": 63, "test_loss": 1.070684483384385, "test_acc1": 73.35, "test_acc5": 91.294}
65
+ {"train_lr": 0.000574220708434935, "train_loss": 1.0248928551632455, "epoch": 64, "test_loss": 1.0702000716153313, "test_acc1": 73.354, "test_acc5": 91.318}
66
+ {"train_lr": 0.0005460095002604524, "train_loss": 1.0226652788677741, "epoch": 65, "test_loss": 1.0710883680969248, "test_acc1": 73.342, "test_acc5": 91.292}
67
+ {"train_lr": 0.0005182463258982946, "train_loss": 1.0228851687935558, "epoch": 66, "test_loss": 1.068965321459124, "test_acc1": 73.378, "test_acc5": 91.374}
68
+ {"train_lr": 0.0004909585842496341, "train_loss": 1.0173290452651629, "epoch": 67, "test_loss": 1.0686252971210748, "test_acc1": 73.414, "test_acc5": 91.404}
69
+ {"train_lr": 0.0004641732050210111, "train_loss": 1.0183380305636087, "epoch": 68, "test_loss": 1.066566807077364, "test_acc1": 73.508, "test_acc5": 91.352}
70
+ {"train_lr": 0.0004379166221478616, "train_loss": 1.0156690546014144, "epoch": 69, "test_loss": 1.0662899416730838, "test_acc1": 73.418, "test_acc5": 91.408}
71
+ {"train_lr": 0.00041221474770750024, "train_loss": 1.0142113912227009, "epoch": 70, "test_loss": 1.0649737461143747, "test_acc1": 73.512, "test_acc5": 91.356}
72
+ {"train_lr": 0.0003870929463470055, "train_loss": 1.0131062789560794, "epoch": 71, "test_loss": 1.0620185296477564, "test_acc1": 73.612, "test_acc5": 91.48}
73
+ {"train_lr": 0.0003625760102513295, "train_loss": 1.0128220649264215, "epoch": 72, "test_loss": 1.063135371831677, "test_acc1": 73.482, "test_acc5": 91.4}
74
+ {"train_lr": 0.0003386881346763327, "train_loss": 1.0111924470828335, "epoch": 73, "test_loss": 1.0624794940585676, "test_acc1": 73.504, "test_acc5": 91.46}
75
+ {"train_lr": 0.0003154528940713109, "train_loss": 1.008184174698589, "epoch": 74, "test_loss": 1.0631436414807045, "test_acc1": 73.482, "test_acc5": 91.406}
76
+ {"train_lr": 0.00029289321881343744, "train_loss": 1.0071958508215997, "epoch": 75, "test_loss": 1.0615671491226577, "test_acc1": 73.53, "test_acc5": 91.436}
77
+ {"train_lr": 0.0002710313725785874, "train_loss": 1.0046371940882073, "epoch": 76, "test_loss": 1.0619150495818814, "test_acc1": 73.48, "test_acc5": 91.416}
78
+ {"train_lr": 0.0002498889303695469, "train_loss": 1.0025258157469252, "epoch": 77, "test_loss": 1.0603039739534372, "test_acc1": 73.544, "test_acc5": 91.42}
79
+ {"train_lr": 0.0002294867572242191, "train_loss": 1.0013484704169424, "epoch": 78, "test_loss": 1.0590004717450008, "test_acc1": 73.714, "test_acc5": 91.44}
80
+ {"train_lr": 0.0002098449876243195, "train_loss": 1.002150521057394, "epoch": 79, "test_loss": 1.0596403076749323, "test_acc1": 73.62, "test_acc5": 91.432}
81
+ {"train_lr": 0.00019098300562504553, "train_loss": 1.0011626567053071, "epoch": 80, "test_loss": 1.0583415099650697, "test_acc1": 73.586, "test_acc5": 91.476}
82
+ {"train_lr": 0.00017291942572544524, "train_loss": 1.0000380077721165, "epoch": 81, "test_loss": 1.0571664700003536, "test_acc1": 73.58, "test_acc5": 91.506}
83
+ {"train_lr": 0.0001556720744979767, "train_loss": 0.9977164441943644, "epoch": 82, "test_loss": 1.057512099976125, "test_acc1": 73.612, "test_acc5": 91.414}
84
+ {"train_lr": 0.00013925797299606019, "train_loss": 0.9957548426631637, "epoch": 83, "test_loss": 1.0571912611308305, "test_acc1": 73.654, "test_acc5": 91.464}
85
+ {"train_lr": 0.00012369331995613583, "train_loss": 0.9980447720818123, "epoch": 84, "test_loss": 1.0569140627942122, "test_acc1": 73.61, "test_acc5": 91.456}
86
+ {"train_lr": 0.00010899347581163435, "train_loss": 0.9969114293777795, "epoch": 85, "test_loss": 1.0565736161549684, "test_acc1": 73.602, "test_acc5": 91.47}
87
+ {"train_lr": 9.5172947533978e-05, "train_loss": 0.9945580941162441, "epoch": 86, "test_loss": 1.0560973775966087, "test_acc1": 73.64, "test_acc5": 91.476}
88
+ {"train_lr": 8.224537431602316e-05, "train_loss": 0.994675159487089, "epoch": 87, "test_loss": 1.055381961871901, "test_acc1": 73.694, "test_acc5": 91.504}
89
+ {"train_lr": 7.022351411175157e-05, "train_loss": 0.9932723817316189, "epoch": 88, "test_loss": 1.0556020966881072, "test_acc1": 73.664, "test_acc5": 91.48}
90
+ {"train_lr": 5.911923104577377e-05, "train_loss": 0.9933186636131095, "epoch": 89, "test_loss": 1.055350568745752, "test_acc1": 73.712, "test_acc5": 91.504}
91
+ {"train_lr": 4.8943483704848814e-05, "train_loss": 0.9938351032474829, "epoch": 90, "test_loss": 1.0547151328505153, "test_acc1": 73.714, "test_acc5": 91.446}
92
+ {"train_lr": 3.9706314323055196e-05, "train_loss": 0.9929382880622036, "epoch": 91, "test_loss": 1.0548186343344277, "test_acc1": 73.646, "test_acc5": 91.472}
93
+ {"train_lr": 3.141683887136792e-05, "train_loss": 0.9906537165665121, "epoch": 92, "test_loss": 1.0548451073334346, "test_acc1": 73.694, "test_acc5": 91.456}
94
+ {"train_lr": 2.4083238061252423e-05, "train_loss": 0.9911015109031428, "epoch": 93, "test_loss": 1.054458876933588, "test_acc1": 73.686, "test_acc5": 91.492}
95
+ {"train_lr": 1.7712749271312274e-05, "train_loss": 0.99034569661021, "epoch": 94, "test_loss": 1.0542710842683798, "test_acc1": 73.694, "test_acc5": 91.482}
96
+ {"train_lr": 1.2311659404861753e-05, "train_loss": 0.9884893892111895, "epoch": 95, "test_loss": 1.0543858788126266, "test_acc1": 73.704, "test_acc5": 91.486}
97
+ {"train_lr": 7.885298685522277e-06, "train_loss": 0.9893691723067142, "epoch": 96, "test_loss": 1.0543649547621416, "test_acc1": 73.726, "test_acc5": 91.482}
98
+ {"train_lr": 4.4380353969200165e-06, "train_loss": 0.9903206042364936, "epoch": 97, "test_loss": 1.0544435060999888, "test_acc1": 73.714, "test_acc5": 91.494}
99
+ {"train_lr": 1.9732715717283947e-06, "train_loss": 0.9900679454516993, "epoch": 98, "test_loss": 1.054438585972847, "test_acc1": 73.714, "test_acc5": 91.494}
100
+ {"train_lr": 4.934396342684219e-07, "train_loss": 0.9899225742178491, "epoch": 99, "test_loss": 1.0544470076823174, "test_acc1": 73.71, "test_acc5": 91.496}