Upload exp_phase8_bridge_recipeABC_KDproper_205153/log.jsonl with huggingface_hub
Browse files
exp_phase8_bridge_recipeABC_KDproper_205153/log.jsonl
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{"step": 0, "loss": 1.5086474418640137, "loss_mdlm": 1.3096985816955566, "loss_lm": 1.9894880056381226, "loss_ct": 0.0, "lr": 0.0, "gnorm": 1.5714740753173828, "bridge_gate_avg": 1.0, "bridge_out_proj_avg": 0.0, "elapsed_s": 3.3296854496002197}
|
| 2 |
+
{"step": 100, "loss": 1.466424822807312, "loss_mdlm": 1.3505407571792603, "loss_lm": 1.1588404178619385, "loss_ct": 0.0, "lr": 2.5e-05, "gnorm": 0.7537240982055664, "bridge_gate_avg": 1.000937432050705, "bridge_out_proj_avg": 0.0004454420050024055, "elapsed_s": 39.330148220062256}
|
| 3 |
+
{"step": 200, "loss": 1.428380012512207, "loss_mdlm": 1.279985785484314, "loss_lm": 1.4839422702789307, "loss_ct": 0.0, "lr": 5e-05, "gnorm": 0.8284399509429932, "bridge_gate_avg": 1.00360506772995, "bridge_out_proj_avg": 0.001611868035979569, "elapsed_s": 73.3454532623291}
|
| 4 |
+
{"step": 300, "loss": 1.3763195276260376, "loss_mdlm": 1.3093442916870117, "loss_lm": 0.6697518825531006, "loss_ct": 0.0, "lr": 4.962019382530521e-05, "gnorm": 0.5907763838768005, "bridge_gate_avg": 1.0042156875133514, "bridge_out_proj_avg": 0.0018374014471191913, "elapsed_s": 106.25103831291199}
|