Upload exp_phase5_stage_a_v7_reasoning_t1_lora_r64_20260502_074716/log.jsonl with huggingface_hub
Browse files
exp_phase5_stage_a_v7_reasoning_t1_lora_r64_20260502_074716/log.jsonl
ADDED
|
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{"step": 20, "loss": NaN, "elapsed_s": 5.731360673904419}
|
| 2 |
+
{"step": 40, "loss": NaN, "elapsed_s": 7.778916835784912}
|
| 3 |
+
{"step": 60, "loss": NaN, "elapsed_s": 9.806840896606445}
|
| 4 |
+
{"step": 80, "loss": NaN, "elapsed_s": 11.772510051727295}
|
| 5 |
+
{"step": 100, "loss": NaN, "elapsed_s": 13.802911758422852}
|
| 6 |
+
{"step": 120, "loss": 2.5295445919036865, "elapsed_s": 15.905678987503052}
|
| 7 |
+
{"step": 140, "loss": 2.0999183654785156, "elapsed_s": 18.107208728790283}
|
| 8 |
+
{"step": 160, "loss": NaN, "elapsed_s": 20.144402742385864}
|
| 9 |
+
{"step": 180, "loss": NaN, "elapsed_s": 22.249879121780396}
|
| 10 |
+
{"step": 200, "loss": 1.7266323566436768, "elapsed_s": 24.225685358047485}
|
| 11 |
+
{"step": 220, "loss": NaN, "elapsed_s": 26.267016649246216}
|
| 12 |
+
{"step": 240, "loss": 2.0112650394439697, "elapsed_s": 28.242889642715454}
|
| 13 |
+
{"step": 260, "loss": 2.4226670265197754, "elapsed_s": 30.400964975357056}
|
| 14 |
+
{"step": 280, "loss": NaN, "elapsed_s": 32.38187575340271}
|
| 15 |
+
{"step": 300, "loss": NaN, "elapsed_s": 34.420690298080444}
|
| 16 |
+
{"step": 320, "loss": 1.2426788806915283, "elapsed_s": 36.469998836517334}
|
| 17 |
+
{"step": 340, "loss": NaN, "elapsed_s": 38.53470277786255}
|