explcre commited on
Commit
0eed91d
·
verified ·
1 Parent(s): 128f419

Upload exp_phase8_through_mdlm_svgspo_20260501_030213/log.jsonl with huggingface_hub

Browse files
exp_phase8_through_mdlm_svgspo_20260501_030213/log.jsonl ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"step": 10, "loss": -0.0034270882606506348, "reward_mean": -0.06494326889514923, "elapsed_s": 307.738162279129}
2
+ {"step": 20, "loss": -0.0017684251070022583, "reward_mean": -0.012319823261350393, "elapsed_s": 614.7154757976532}
3
+ {"step": 30, "loss": -0.006462752819061279, "reward_mean": 0.13936650846153498, "elapsed_s": 922.1146523952484}
4
+ {"step": 40, "loss": 0.0013982467353343964, "reward_mean": 0.4224778562784195, "elapsed_s": 1229.8806874752045}
5
+ {"step": 50, "loss": -0.006531812250614166, "reward_mean": 0.0628681629896164, "elapsed_s": 1536.94970703125}
6
+ {"step": 60, "loss": 0.005877722054719925, "reward_mean": -0.08045199699699879, "elapsed_s": 1844.4274053573608}
7
+ {"step": 70, "loss": -0.007258661091327667, "reward_mean": -0.011964099481701851, "elapsed_s": 2150.9731233119965}
8
+ {"step": 80, "loss": 4.76837158203125e-06, "reward_mean": 0.418991032987833, "elapsed_s": 2456.610666513443}
9
+ {"step": 90, "loss": 0.0015859454870224, "reward_mean": -0.08822085335850716, "elapsed_s": 2762.6486110687256}
10
+ {"step": 100, "loss": -0.008242428302764893, "reward_mean": 0.3108661472797394, "elapsed_s": 3068.688961982727}
11
+ {"step": 110, "loss": 0.0021303370594978333, "reward_mean": 0.7970281541347504, "elapsed_s": 4255.073075771332}
12
+ {"step": 120, "loss": 0.0006234720349311829, "reward_mean": -0.010967331007122993, "elapsed_s": 4560.374354362488}
13
+ {"step": 130, "loss": 6.160140037536621e-05, "reward_mean": 0.23303482308983803, "elapsed_s": 4866.885046243668}
14
+ {"step": 140, "loss": -0.0010533034801483154, "reward_mean": -0.05029655247926712, "elapsed_s": 5169.8928463459015}
15
+ {"step": 150, "loss": 0.007994145154953003, "reward_mean": 0.23319999873638153, "elapsed_s": 5473.405427694321}
16
+ {"step": 160, "loss": -0.002621203660964966, "reward_mean": 0.34549144469201565, "elapsed_s": 5777.982485771179}
17
+ {"step": 170, "loss": -0.00040067732334136963, "reward_mean": -0.029216839000582695, "elapsed_s": 6082.830990552902}
18
+ {"step": 180, "loss": 0.0015888810157775879, "reward_mean": 0.21011998876929283, "elapsed_s": 6387.0380136966705}
19
+ {"step": 190, "loss": -0.003651760518550873, "reward_mean": -0.0850878581404686, "elapsed_s": 6690.746138334274}
20
+ {"step": 200, "loss": -0.0011408329010009766, "reward_mean": -0.04496814124286175, "elapsed_s": 6994.859612464905}
21
+ {"step": 210, "loss": -0.004734046757221222, "reward_mean": 0.2900286512449384, "elapsed_s": 8090.8769516944885}
22
+ {"step": 220, "loss": -0.000510089099407196, "reward_mean": 0.2724920017644763, "elapsed_s": 8395.732300519943}
23
+ {"step": 230, "loss": 0.0011174306273460388, "reward_mean": -0.07859226316213608, "elapsed_s": 8701.182558774948}
24
+ {"step": 240, "loss": 0.0022516995668411255, "reward_mean": -0.02631366439163685, "elapsed_s": 9004.869078159332}
25
+ {"step": 250, "loss": -0.003285124897956848, "reward_mean": -0.044884445145726204, "elapsed_s": 9308.358837604523}
26
+ {"step": 260, "loss": 0.0026149190962314606, "reward_mean": -0.07280603796243668, "elapsed_s": 9612.140971422195}
27
+ {"step": 270, "loss": 0.0011996999382972717, "reward_mean": 0.14749733405187726, "elapsed_s": 9915.645687818527}
28
+ {"step": 280, "loss": -0.002142060548067093, "reward_mean": 0.26336554950103164, "elapsed_s": 10219.908189058304}
29
+ {"step": 290, "loss": -0.0017841681838035583, "reward_mean": -0.10801009833812714, "elapsed_s": 10522.237151622772}
30
+ {"step": 300, "loss": 0.0023226141929626465, "reward_mean": 0.06800594925880432, "elapsed_s": 10827.069626808167}