explcre commited on
Commit
ba67233
·
verified ·
1 Parent(s): 8583d45

Upload exp_phase5_stage_a_v7_reasoning_t2_r128_FIXED_20260505_193938/log.jsonl with huggingface_hub

Browse files
exp_phase5_stage_a_v7_reasoning_t2_r128_FIXED_20260505_193938/log.jsonl CHANGED
@@ -11,3 +11,140 @@
11
  {"step": 220, "loss": 0.9342570304870605, "elapsed_s": 63.89808368682861}
12
  {"step": 240, "loss": 1.1639739274978638, "elapsed_s": 69.15105271339417}
13
  {"step": 260, "loss": 0.9906618595123291, "elapsed_s": 74.28221917152405}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
11
  {"step": 220, "loss": 0.9342570304870605, "elapsed_s": 63.89808368682861}
12
  {"step": 240, "loss": 1.1639739274978638, "elapsed_s": 69.15105271339417}
13
  {"step": 260, "loss": 0.9906618595123291, "elapsed_s": 74.28221917152405}
14
+ {"step": 280, "loss": 0.9217384457588196, "elapsed_s": 79.52862787246704}
15
+ {"step": 300, "loss": 1.0134793519973755, "elapsed_s": 84.66254329681396}
16
+ {"step": 320, "loss": 0.9703929424285889, "elapsed_s": 89.68356895446777}
17
+ {"step": 340, "loss": 0.934944748878479, "elapsed_s": 94.81912326812744}
18
+ {"step": 360, "loss": 1.0074201822280884, "elapsed_s": 99.89717555046082}
19
+ {"step": 380, "loss": 0.6672135591506958, "elapsed_s": 104.99657034873962}
20
+ {"step": 400, "loss": 1.0285619497299194, "elapsed_s": 110.19235754013062}
21
+ {"step": 420, "loss": 0.7391230463981628, "elapsed_s": 115.4782772064209}
22
+ {"step": 440, "loss": 0.841978907585144, "elapsed_s": 120.51270604133606}
23
+ {"step": 460, "loss": 1.0560815334320068, "elapsed_s": 125.65765833854675}
24
+ {"step": 480, "loss": 0.6530693173408508, "elapsed_s": 130.65622186660767}
25
+ {"step": 500, "loss": 0.7006113529205322, "elapsed_s": 135.74453568458557}
26
+ {"step": 520, "loss": 0.8912713527679443, "elapsed_s": 140.99209880828857}
27
+ {"step": 540, "loss": 0.8923031687736511, "elapsed_s": 146.01203083992004}
28
+ {"step": 560, "loss": 0.7651110291481018, "elapsed_s": 151.10123348236084}
29
+ {"step": 580, "loss": 0.8456388711929321, "elapsed_s": 156.1442632675171}
30
+ {"step": 600, "loss": 0.5726004838943481, "elapsed_s": 161.09750866889954}
31
+ {"step": 620, "loss": 0.7869890928268433, "elapsed_s": 166.1252555847168}
32
+ {"step": 640, "loss": 0.6021872162818909, "elapsed_s": 171.1144254207611}
33
+ {"step": 660, "loss": 0.7394794821739197, "elapsed_s": 176.17365884780884}
34
+ {"step": 680, "loss": 0.6975713968276978, "elapsed_s": 181.4919183254242}
35
+ {"step": 700, "loss": 0.6365028023719788, "elapsed_s": 186.3664162158966}
36
+ {"step": 720, "loss": 0.9330570101737976, "elapsed_s": 191.32875537872314}
37
+ {"step": 740, "loss": 0.8374877572059631, "elapsed_s": 196.4091992378235}
38
+ {"step": 760, "loss": 0.7793827056884766, "elapsed_s": 201.38521718978882}
39
+ {"step": 780, "loss": 0.604881227016449, "elapsed_s": 206.31816792488098}
40
+ {"step": 800, "loss": 0.886054515838623, "elapsed_s": 211.34451532363892}
41
+ {"step": 820, "loss": 0.7571917176246643, "elapsed_s": 216.3378665447235}
42
+ {"step": 840, "loss": 0.8188043832778931, "elapsed_s": 221.21401405334473}
43
+ {"step": 860, "loss": 0.5729079842567444, "elapsed_s": 226.2276954650879}
44
+ {"step": 880, "loss": 0.7704076170921326, "elapsed_s": 231.11284494400024}
45
+ {"step": 900, "loss": 0.5692376494407654, "elapsed_s": 235.97811269760132}
46
+ {"step": 920, "loss": 0.902776300907135, "elapsed_s": 240.82952046394348}
47
+ {"step": 940, "loss": 0.6443384289741516, "elapsed_s": 245.81543111801147}
48
+ {"step": 960, "loss": 0.6292765736579895, "elapsed_s": 250.68277168273926}
49
+ {"step": 980, "loss": 0.6460203528404236, "elapsed_s": 255.5410816669464}
50
+ {"step": 1000, "loss": 0.690719723701477, "elapsed_s": 260.4375681877136}
51
+ {"step": 1020, "loss": 0.8257105350494385, "elapsed_s": 265.3406116962433}
52
+ {"step": 1040, "loss": 0.8443910479545593, "elapsed_s": 270.2501883506775}
53
+ {"step": 1060, "loss": 0.9427888989448547, "elapsed_s": 274.97527503967285}
54
+ {"step": 1080, "loss": 0.6492099165916443, "elapsed_s": 279.78276920318604}
55
+ {"step": 1100, "loss": 0.7547662854194641, "elapsed_s": 284.7539110183716}
56
+ {"step": 1120, "loss": 0.7964253425598145, "elapsed_s": 289.51826453208923}
57
+ {"step": 1140, "loss": 0.5524964928627014, "elapsed_s": 294.37365674972534}
58
+ {"step": 1160, "loss": 0.7119346261024475, "elapsed_s": 299.2078764438629}
59
+ {"step": 1180, "loss": 0.6448314189910889, "elapsed_s": 304.03602147102356}
60
+ {"step": 1200, "loss": 0.9455552697181702, "elapsed_s": 308.9580409526825}
61
+ {"step": 1220, "loss": 0.514221727848053, "elapsed_s": 313.68317890167236}
62
+ {"step": 1240, "loss": 0.8191384077072144, "elapsed_s": 318.56613516807556}
63
+ {"step": 1260, "loss": 0.7116103768348694, "elapsed_s": 323.33849143981934}
64
+ {"step": 1280, "loss": 0.3450673222541809, "elapsed_s": 328.32604789733887}
65
+ {"step": 1300, "loss": 0.646104633808136, "elapsed_s": 333.17261838912964}
66
+ {"step": 1320, "loss": 0.7678859233856201, "elapsed_s": 337.98112058639526}
67
+ {"step": 1340, "loss": 0.7468214631080627, "elapsed_s": 342.98217272758484}
68
+ {"step": 1360, "loss": 0.6010539531707764, "elapsed_s": 347.7629635334015}
69
+ {"step": 1380, "loss": 0.42219147086143494, "elapsed_s": 352.5723373889923}
70
+ {"step": 1400, "loss": 0.7000728249549866, "elapsed_s": 357.35963773727417}
71
+ {"step": 1420, "loss": 0.44703811407089233, "elapsed_s": 362.2910363674164}
72
+ {"step": 1440, "loss": 0.7499022483825684, "elapsed_s": 367.2216486930847}
73
+ {"step": 1460, "loss": 0.4872989356517792, "elapsed_s": 372.018043756485}
74
+ {"step": 1480, "loss": 0.785200834274292, "elapsed_s": 376.82967615127563}
75
+ {"step": 1500, "loss": 0.7409285306930542, "elapsed_s": 381.59858679771423}
76
+ {"step": 1520, "loss": 0.5835148096084595, "elapsed_s": 386.50145411491394}
77
+ {"step": 1540, "loss": 0.5633326768875122, "elapsed_s": 391.41010093688965}
78
+ {"step": 1560, "loss": 0.5728590488433838, "elapsed_s": 396.1072106361389}
79
+ {"step": 1580, "loss": 0.7403851747512817, "elapsed_s": 400.9511921405792}
80
+ {"step": 1600, "loss": 0.6663960218429565, "elapsed_s": 405.6753566265106}
81
+ {"step": 1620, "loss": 0.6360340714454651, "elapsed_s": 410.7599458694458}
82
+ {"step": 1640, "loss": 0.8170230984687805, "elapsed_s": 415.5339388847351}
83
+ {"step": 1660, "loss": 0.47957849502563477, "elapsed_s": 420.41765427589417}
84
+ {"step": 1680, "loss": 0.5263388156890869, "elapsed_s": 425.08281326293945}
85
+ {"step": 1700, "loss": 0.7186670899391174, "elapsed_s": 429.9818768501282}
86
+ {"step": 1720, "loss": 0.6396377086639404, "elapsed_s": 434.89931654930115}
87
+ {"step": 1740, "loss": 0.7117732167243958, "elapsed_s": 439.65157318115234}
88
+ {"step": 1760, "loss": 0.6532768607139587, "elapsed_s": 444.43253207206726}
89
+ {"step": 1780, "loss": 0.5249560475349426, "elapsed_s": 449.24021005630493}
90
+ {"step": 1800, "loss": 0.776771068572998, "elapsed_s": 454.2873365879059}
91
+ {"step": 1820, "loss": 0.698784589767456, "elapsed_s": 459.029944896698}
92
+ {"step": 1840, "loss": 0.6735374927520752, "elapsed_s": 463.77927827835083}
93
+ {"step": 1860, "loss": 0.6430699229240417, "elapsed_s": 468.546804189682}
94
+ {"step": 1880, "loss": 0.5950252413749695, "elapsed_s": 473.2620642185211}
95
+ {"step": 1900, "loss": 0.8065794110298157, "elapsed_s": 478.14286160469055}
96
+ {"step": 1920, "loss": 0.6855514049530029, "elapsed_s": 482.9271614551544}
97
+ {"step": 1940, "loss": 0.5631692409515381, "elapsed_s": 487.5945448875427}
98
+ {"step": 1960, "loss": 0.7875005602836609, "elapsed_s": 492.35640025138855}
99
+ {"step": 1980, "loss": 0.690204918384552, "elapsed_s": 497.15804719924927}
100
+ {"step": 2000, "loss": 0.6040239930152893, "elapsed_s": 501.9295856952667}
101
+ {"step": 2020, "loss": 0.6380578875541687, "elapsed_s": 506.74664974212646}
102
+ {"step": 2040, "loss": 0.5394318103790283, "elapsed_s": 511.5181906223297}
103
+ {"step": 2060, "loss": 0.7548812031745911, "elapsed_s": 516.2892076969147}
104
+ {"step": 2080, "loss": 0.842311441898346, "elapsed_s": 521.0991258621216}
105
+ {"step": 2100, "loss": 0.664849042892456, "elapsed_s": 525.896852016449}
106
+ {"step": 2120, "loss": 0.7084640264511108, "elapsed_s": 530.6799962520599}
107
+ {"step": 2140, "loss": 0.5340833067893982, "elapsed_s": 535.4615280628204}
108
+ {"step": 2160, "loss": 0.5146570205688477, "elapsed_s": 540.1990118026733}
109
+ {"step": 2180, "loss": 0.6764290928840637, "elapsed_s": 544.9808127880096}
110
+ {"step": 2200, "loss": 0.7196254134178162, "elapsed_s": 549.7997944355011}
111
+ {"step": 2220, "loss": 0.663967490196228, "elapsed_s": 554.6405785083771}
112
+ {"step": 2240, "loss": 0.5817448496818542, "elapsed_s": 559.393562078476}
113
+ {"step": 2260, "loss": 0.6752156019210815, "elapsed_s": 564.1076827049255}
114
+ {"step": 2280, "loss": 0.7756117582321167, "elapsed_s": 568.8703010082245}
115
+ {"step": 2300, "loss": 0.8056526184082031, "elapsed_s": 573.7152421474457}
116
+ {"step": 2320, "loss": 0.7155594229698181, "elapsed_s": 578.5602447986603}
117
+ {"step": 2340, "loss": 0.5922985076904297, "elapsed_s": 583.4288778305054}
118
+ {"step": 2360, "loss": 0.6393532752990723, "elapsed_s": 588.172794342041}
119
+ {"step": 2380, "loss": 0.680176854133606, "elapsed_s": 592.9839241504669}
120
+ {"step": 2400, "loss": 0.48348119854927063, "elapsed_s": 597.7881705760956}
121
+ {"step": 2420, "loss": 0.7194271087646484, "elapsed_s": 602.5470266342163}
122
+ {"step": 2440, "loss": 0.3756081759929657, "elapsed_s": 607.312563419342}
123
+ {"step": 2460, "loss": 0.6777275204658508, "elapsed_s": 612.092348575592}
124
+ {"step": 2480, "loss": 0.7009856104850769, "elapsed_s": 616.8879475593567}
125
+ {"step": 2500, "loss": 0.6018471121788025, "elapsed_s": 621.657110452652}
126
+ {"step": 2520, "loss": 0.6428532004356384, "elapsed_s": 626.4403429031372}
127
+ {"step": 2540, "loss": 0.5736479163169861, "elapsed_s": 631.2488265037537}
128
+ {"step": 2560, "loss": 0.5846017599105835, "elapsed_s": 635.997076511383}
129
+ {"step": 2580, "loss": 0.521944522857666, "elapsed_s": 640.8334317207336}
130
+ {"step": 2600, "loss": 0.381876677274704, "elapsed_s": 645.5900771617889}
131
+ {"step": 2620, "loss": 0.4446439743041992, "elapsed_s": 650.3797936439514}
132
+ {"step": 2640, "loss": 0.5909258127212524, "elapsed_s": 655.1421356201172}
133
+ {"step": 2660, "loss": 0.7309444546699524, "elapsed_s": 659.8624119758606}
134
+ {"step": 2680, "loss": 0.6599928140640259, "elapsed_s": 664.6286828517914}
135
+ {"step": 2700, "loss": 0.6313130855560303, "elapsed_s": 669.4205410480499}
136
+ {"step": 2720, "loss": 0.5966728329658508, "elapsed_s": 674.1117067337036}
137
+ {"step": 2740, "loss": 0.5969704985618591, "elapsed_s": 678.9011998176575}
138
+ {"step": 2760, "loss": 0.5524131655693054, "elapsed_s": 683.6077523231506}
139
+ {"step": 2780, "loss": 0.656955361366272, "elapsed_s": 688.2720732688904}
140
+ {"step": 2800, "loss": 0.5542805194854736, "elapsed_s": 693.0075232982635}
141
+ {"step": 2820, "loss": 0.7230316400527954, "elapsed_s": 697.7881722450256}
142
+ {"step": 2840, "loss": 0.6691194176673889, "elapsed_s": 702.5299088954926}
143
+ {"step": 2860, "loss": 0.37612462043762207, "elapsed_s": 707.2653095722198}
144
+ {"step": 2880, "loss": 0.6314190626144409, "elapsed_s": 712.0567135810852}
145
+ {"step": 2900, "loss": 0.5167427062988281, "elapsed_s": 716.8392879962921}
146
+ {"step": 2920, "loss": 0.5582223534584045, "elapsed_s": 721.4655737876892}
147
+ {"step": 2940, "loss": 0.6079427003860474, "elapsed_s": 726.1486926078796}
148
+ {"step": 2960, "loss": 0.5880207419395447, "elapsed_s": 730.9058756828308}
149
+ {"step": 2980, "loss": 0.47934576869010925, "elapsed_s": 735.6948935985565}
150
+ {"step": 3000, "loss": 0.6230853796005249, "elapsed_s": 740.4467792510986}