Models_Ouput2 / trainer_log.jsonl
youssefedweqd's picture
Model save
ae530ba verified
{"current_steps": 16450, "total_steps": 18120, "loss": 0.2751, "lr": 2.5682530093579626e-06, "epoch": 2.7235099337748343, "percentage": 90.78, "elapsed_time": "0:05:13", "remaining_time": "0:00:31"}
{"current_steps": 16500, "total_steps": 18120, "loss": 0.2741, "lr": 2.418089536248769e-06, "epoch": 2.7317880794701987, "percentage": 91.06, "elapsed_time": "0:10:04", "remaining_time": "0:00:59"}
{"current_steps": 16550, "total_steps": 18120, "loss": 0.2772, "lr": 2.2723405158236455e-06, "epoch": 2.7400662251655628, "percentage": 91.34, "elapsed_time": "0:15:23", "remaining_time": "0:01:27"}
{"current_steps": 16600, "total_steps": 18120, "loss": 0.2715, "lr": 2.1310194700733697e-06, "epoch": 2.748344370860927, "percentage": 91.61, "elapsed_time": "0:20:25", "remaining_time": "0:01:52"}
{"current_steps": 16650, "total_steps": 18120, "loss": 0.2712, "lr": 1.9941395101795655e-06, "epoch": 2.756622516556291, "percentage": 91.89, "elapsed_time": "0:25:52", "remaining_time": "0:02:17"}
{"current_steps": 16700, "total_steps": 18120, "loss": 0.2758, "lr": 1.861713335298282e-06, "epoch": 2.7649006622516556, "percentage": 92.16, "elapsed_time": "0:31:10", "remaining_time": "0:02:39"}
{"current_steps": 16750, "total_steps": 18120, "loss": 0.2786, "lr": 1.7337532313818294e-06, "epoch": 2.77317880794702, "percentage": 92.44, "elapsed_time": "0:36:15", "remaining_time": "0:02:57"}
{"current_steps": 16800, "total_steps": 18120, "loss": 0.272, "lr": 1.6102710700389656e-06, "epoch": 2.781456953642384, "percentage": 92.72, "elapsed_time": "0:41:45", "remaining_time": "0:03:16"}
{"current_steps": 16850, "total_steps": 18120, "loss": 0.2839, "lr": 1.4912783074334469e-06, "epoch": 2.789735099337748, "percentage": 92.99, "elapsed_time": "0:46:53", "remaining_time": "0:03:32"}
{"current_steps": 16900, "total_steps": 18120, "loss": 0.2756, "lr": 1.3767859832212016e-06, "epoch": 2.7980132450331126, "percentage": 93.27, "elapsed_time": "0:52:15", "remaining_time": "0:03:46"}
{"current_steps": 16950, "total_steps": 18120, "loss": 0.2747, "lr": 1.2668047195261379e-06, "epoch": 2.806291390728477, "percentage": 93.54, "elapsed_time": "0:58:18", "remaining_time": "0:04:01"}
{"current_steps": 17000, "total_steps": 18120, "loss": 0.2707, "lr": 1.1613447199546158e-06, "epoch": 2.814569536423841, "percentage": 93.82, "elapsed_time": "1:03:32", "remaining_time": "0:04:11"}
{"current_steps": 17050, "total_steps": 18120, "loss": 0.2702, "lr": 1.0604157686488313e-06, "epoch": 2.8228476821192054, "percentage": 94.09, "elapsed_time": "1:08:49", "remaining_time": "0:04:19"}
{"current_steps": 17100, "total_steps": 18120, "loss": 0.2721, "lr": 9.640272293790998e-07, "epoch": 2.8311258278145695, "percentage": 94.37, "elapsed_time": "1:14:28", "remaining_time": "0:04:26"}
{"current_steps": 17150, "total_steps": 18120, "loss": 0.2734, "lr": 8.721880446750708e-07, "epoch": 2.839403973509934, "percentage": 94.65, "elapsed_time": "1:19:42", "remaining_time": "0:04:30"}
{"current_steps": 17200, "total_steps": 18120, "loss": 0.2757, "lr": 7.849067349961381e-07, "epoch": 2.847682119205298, "percentage": 94.92, "elapsed_time": "1:24:42", "remaining_time": "0:04:31"}
{"current_steps": 17250, "total_steps": 18120, "loss": 0.274, "lr": 7.02191397940899e-07, "epoch": 2.8559602649006623, "percentage": 95.2, "elapsed_time": "1:29:52", "remaining_time": "0:04:31"}
{"current_steps": 17300, "total_steps": 18120, "loss": 0.2721, "lr": 6.240497074959162e-07, "epoch": 2.8642384105960264, "percentage": 95.47, "elapsed_time": "1:34:46", "remaining_time": "0:04:29"}
{"current_steps": 17350, "total_steps": 18120, "loss": 0.279, "lr": 5.504889133237656e-07, "epoch": 2.872516556291391, "percentage": 95.75, "elapsed_time": "1:40:27", "remaining_time": "0:04:27"}
{"current_steps": 17400, "total_steps": 18120, "loss": 0.2744, "lr": 4.815158400904185e-07, "epoch": 2.880794701986755, "percentage": 96.03, "elapsed_time": "1:45:31", "remaining_time": "0:04:21"}
{"current_steps": 17450, "total_steps": 18120, "loss": 0.2795, "lr": 4.1713688683208686e-07, "epoch": 2.8890728476821192, "percentage": 96.3, "elapsed_time": "1:50:38", "remaining_time": "0:04:14"}
{"current_steps": 17500, "total_steps": 18120, "loss": 0.2778, "lr": 3.573580263615539e-07, "epoch": 2.8973509933774837, "percentage": 96.58, "elapsed_time": "1:55:37", "remaining_time": "0:04:05"}
{"current_steps": 17550, "total_steps": 18120, "loss": 0.2757, "lr": 3.0218480471403965e-07, "epoch": 2.9056291390728477, "percentage": 96.85, "elapsed_time": "2:01:00", "remaining_time": "0:03:55"}
{"current_steps": 17600, "total_steps": 18120, "loss": 0.274, "lr": 2.5162234063264567e-07, "epoch": 2.9139072847682117, "percentage": 97.13, "elapsed_time": "2:06:00", "remaining_time": "0:03:43"}
{"current_steps": 17650, "total_steps": 18120, "loss": 0.2701, "lr": 2.0567532509348508e-07, "epoch": 2.922185430463576, "percentage": 97.41, "elapsed_time": "2:11:36", "remaining_time": "0:03:30"}
{"current_steps": 17700, "total_steps": 18120, "loss": 0.2693, "lr": 1.6434802087046397e-07, "epoch": 2.9304635761589406, "percentage": 97.68, "elapsed_time": "2:16:37", "remaining_time": "0:03:14"}
{"current_steps": 17750, "total_steps": 18120, "loss": 0.2637, "lr": 1.276442621397922e-07, "epoch": 2.9387417218543046, "percentage": 97.96, "elapsed_time": "2:22:29", "remaining_time": "0:02:58"}
{"current_steps": 17800, "total_steps": 18120, "loss": 0.2657, "lr": 9.556745412425683e-08, "epoch": 2.9470198675496686, "percentage": 98.23, "elapsed_time": "2:27:27", "remaining_time": "0:02:39"}
{"current_steps": 17850, "total_steps": 18120, "loss": 0.272, "lr": 6.812057277733042e-08, "epoch": 2.955298013245033, "percentage": 98.51, "elapsed_time": "2:33:03", "remaining_time": "0:02:18"}
{"current_steps": 17900, "total_steps": 18120, "loss": 0.2696, "lr": 4.530616450704184e-08, "epoch": 2.9635761589403975, "percentage": 98.79, "elapsed_time": "2:38:13", "remaining_time": "0:01:56"}
{"current_steps": 17950, "total_steps": 18120, "loss": 0.2712, "lr": 2.712634593974861e-08, "epoch": 2.9718543046357615, "percentage": 99.06, "elapsed_time": "2:43:20", "remaining_time": "0:01:32"}
{"current_steps": 18000, "total_steps": 18120, "loss": 0.2695, "lr": 1.358280372376064e-08, "epoch": 2.980132450331126, "percentage": 99.34, "elapsed_time": "2:48:21", "remaining_time": "0:01:07"}
{"current_steps": 18050, "total_steps": 18120, "loss": 0.277, "lr": 4.6767943728598386e-09, "epoch": 2.98841059602649, "percentage": 99.61, "elapsed_time": "2:53:10", "remaining_time": "0:00:40"}
{"current_steps": 18100, "total_steps": 18120, "loss": 0.2837, "lr": 4.091441497322546e-10, "epoch": 2.9966887417218544, "percentage": 99.89, "elapsed_time": "2:58:23", "remaining_time": "0:00:11"}
{"current_steps": 18120, "total_steps": 18120, "eval_loss": 0.3766781985759735, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "3:52:54", "remaining_time": "0:00:00"}
{"current_steps": 18120, "total_steps": 18120, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "3:52:54", "remaining_time": "0:00:00"}