explcre commited on
Commit
afde56e
·
verified ·
1 Parent(s): 16f0667

Upload exp_phase8_bridge_recipeABC_300step_035043/log.jsonl with huggingface_hub

Browse files
exp_phase8_bridge_recipeABC_300step_035043/log.jsonl ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"step": 0, "loss": 2.2810750007629395, "loss_mdlm": 1.3196226358413696, "loss_lm": 1.9229048490524292, "loss_ct": 0.0, "lr": 0.0, "gnorm": 6.22329044342041, "bridge_gate_avg": 1.0, "bridge_out_proj_avg": 0.0, "elapsed_s": 3.5541374683380127}
2
+ {"step": 25, "loss": 1.4694701433181763, "loss_mdlm": 0.7427740097045898, "loss_lm": 1.4533922672271729, "loss_ct": 0.0, "lr": 4.166666666666667e-05, "gnorm": 2.6370227336883545, "bridge_gate_avg": 1.000319004058838, "bridge_out_proj_avg": 0.00017790815036278218, "elapsed_s": 15.706307649612427}
3
+ {"step": 50, "loss": 2.005795955657959, "loss_mdlm": 1.4064075946807861, "loss_lm": 1.1987766027450562, "loss_ct": 0.0, "lr": 4.9326121764495596e-05, "gnorm": 3.9589033126831055, "bridge_gate_avg": 1.0008048117160797, "bridge_out_proj_avg": 0.00041387030796613544, "elapsed_s": 28.02803874015808}
4
+ {"step": 75, "loss": 1.843766450881958, "loss_mdlm": 1.3427734375, "loss_lm": 1.0019859075546265, "loss_ct": 0.0, "lr": 4.665063509461097e-05, "gnorm": 3.244795799255371, "bridge_gate_avg": 1.001827359199524, "bridge_out_proj_avg": 0.0008815678738756105, "elapsed_s": 40.26014590263367}
5
+ {"step": 100, "loss": 1.8309361934661865, "loss_mdlm": 1.3361928462982178, "loss_lm": 0.989486813545227, "loss_ct": 0.0, "lr": 4.215604094671835e-05, "gnorm": 3.332274913787842, "bridge_gate_avg": 1.002499520778656, "bridge_out_proj_avg": 0.001246427942533046, "elapsed_s": 52.17511534690857}
6
+ {"step": 125, "loss": 1.835036039352417, "loss_mdlm": 1.3302626609802246, "loss_lm": 1.0095466375350952, "loss_ct": 0.0, "lr": 3.621997950501156e-05, "gnorm": 3.2755086421966553, "bridge_gate_avg": 1.0026077628135681, "bridge_out_proj_avg": 0.00134880215045996, "elapsed_s": 64.07104277610779}
7
+ {"step": 150, "loss": 1.8255870342254639, "loss_mdlm": 1.3208285570144653, "loss_lm": 1.0095168352127075, "loss_ct": 0.0, "lr": 2.9341204441673266e-05, "gnorm": 3.2750401496887207, "bridge_gate_avg": 1.00302454829216, "bridge_out_proj_avg": 0.0015377872623503208, "elapsed_s": 76.05668926239014}
8
+ {"step": 175, "loss": 1.7289721965789795, "loss_mdlm": 1.3014837503433228, "loss_lm": 0.8549769520759583, "loss_ct": 0.0, "lr": 2.2097677146869242e-05, "gnorm": 3.160585403442383, "bridge_gate_avg": 1.0033977329730988, "bridge_out_proj_avg": 0.0016631950857117772, "elapsed_s": 87.88038611412048}
9
+ {"step": 200, "loss": 2.059060573577881, "loss_mdlm": 1.3455456495285034, "loss_lm": 1.4270298480987549, "loss_ct": 0.0, "lr": 1.509800584902108e-05, "gnorm": 3.444671154022217, "bridge_gate_avg": 1.0035595297813416, "bridge_out_proj_avg": 0.0017156197573058307, "elapsed_s": 99.72339105606079}
10
+ {"step": 225, "loss": 1.9769656658172607, "loss_mdlm": 1.339945912361145, "loss_lm": 1.274039387702942, "loss_ct": 0.0, "lr": 8.930309757836517e-06, "gnorm": 3.8006086349487305, "bridge_gate_avg": 1.0036472976207733, "bridge_out_proj_avg": 0.0017352754657622427, "elapsed_s": 111.67326998710632}
11
+ {"step": 250, "loss": 1.7251914739608765, "loss_mdlm": 1.280639410018921, "loss_lm": 0.8891040682792664, "loss_ct": 0.0, "lr": 4.112804714676594e-06, "gnorm": 3.708483934402466, "bridge_gate_avg": 1.0036917924880981, "bridge_out_proj_avg": 0.0017449887527618557, "elapsed_s": 123.5641131401062}
12
+ {"step": 275, "loss": 1.660829782485962, "loss_mdlm": 1.3798034191131592, "loss_lm": 0.562052845954895, "loss_ct": 0.0, "lr": 1.0502621921127776e-06, "gnorm": 2.5561678409576416, "bridge_gate_avg": 1.0037106573581696, "bridge_out_proj_avg": 0.0017500638496130705, "elapsed_s": 134.73223686218262}