Mistral-Nemo-Finetuned / trainer_log.jsonl
SamChen888's picture
Upload folder using huggingface_hub
06e71fe verified
{"current_steps": 10, "total_steps": 348, "loss": 0.0829, "lr": 2.9938918800982563e-05, "epoch": 0.08602150537634409, "percentage": 2.87, "elapsed_time": "0:00:54", "remaining_time": "0:30:25"}
{"current_steps": 20, "total_steps": 348, "loss": 0.073, "lr": 2.975617265898004e-05, "epoch": 0.17204301075268819, "percentage": 5.75, "elapsed_time": "0:01:44", "remaining_time": "0:28:32"}
{"current_steps": 30, "total_steps": 348, "loss": 0.068, "lr": 2.9453249887788343e-05, "epoch": 0.25806451612903225, "percentage": 8.62, "elapsed_time": "0:02:37", "remaining_time": "0:27:52"}
{"current_steps": 40, "total_steps": 348, "loss": 0.0603, "lr": 2.9032617538884018e-05, "epoch": 0.34408602150537637, "percentage": 11.49, "elapsed_time": "0:03:30", "remaining_time": "0:26:57"}
{"current_steps": 50, "total_steps": 348, "loss": 0.0617, "lr": 2.84977013093626e-05, "epoch": 0.43010752688172044, "percentage": 14.37, "elapsed_time": "0:04:22", "remaining_time": "0:26:02"}
{"current_steps": 60, "total_steps": 348, "loss": 0.0617, "lr": 2.7852857642513838e-05, "epoch": 0.5161290322580645, "percentage": 17.24, "elapsed_time": "0:05:12", "remaining_time": "0:25:01"}
{"current_steps": 70, "total_steps": 348, "loss": 0.0587, "lr": 2.7103338248251055e-05, "epoch": 0.6021505376344086, "percentage": 20.11, "elapsed_time": "0:06:03", "remaining_time": "0:24:05"}
{"current_steps": 80, "total_steps": 348, "loss": 0.0555, "lr": 2.6255247332346036e-05, "epoch": 0.6881720430107527, "percentage": 22.99, "elapsed_time": "0:06:55", "remaining_time": "0:23:12"}
{"current_steps": 90, "total_steps": 348, "loss": 0.0538, "lr": 2.531549188280135e-05, "epoch": 0.7741935483870968, "percentage": 25.86, "elapsed_time": "0:07:48", "remaining_time": "0:22:23"}
{"current_steps": 100, "total_steps": 348, "loss": 0.0466, "lr": 2.4291725418235848e-05, "epoch": 0.8602150537634409, "percentage": 28.74, "elapsed_time": "0:08:40", "remaining_time": "0:21:31"}
{"current_steps": 110, "total_steps": 348, "loss": 0.0457, "lr": 2.3192285656405456e-05, "epoch": 0.946236559139785, "percentage": 31.61, "elapsed_time": "0:09:31", "remaining_time": "0:20:36"}
{"current_steps": 120, "total_steps": 348, "loss": 0.0491, "lr": 2.2026126610496852e-05, "epoch": 1.032258064516129, "percentage": 34.48, "elapsed_time": "0:10:21", "remaining_time": "0:19:41"}
{"current_steps": 130, "total_steps": 348, "loss": 0.0421, "lr": 2.0802745666212592e-05, "epoch": 1.118279569892473, "percentage": 37.36, "elapsed_time": "0:11:14", "remaining_time": "0:18:50"}
{"current_steps": 140, "total_steps": 348, "loss": 0.0429, "lr": 1.953210623354359e-05, "epoch": 1.2043010752688172, "percentage": 40.23, "elapsed_time": "0:12:06", "remaining_time": "0:17:59"}
{"current_steps": 150, "total_steps": 348, "loss": 0.0448, "lr": 1.8224556603165363e-05, "epoch": 1.2903225806451613, "percentage": 43.1, "elapsed_time": "0:12:57", "remaining_time": "0:17:06"}
{"current_steps": 160, "total_steps": 348, "loss": 0.0439, "lr": 1.689074566830434e-05, "epoch": 1.3763440860215055, "percentage": 45.98, "elapsed_time": "0:13:49", "remaining_time": "0:16:14"}
{"current_steps": 170, "total_steps": 348, "loss": 0.0432, "lr": 1.5541536198449044e-05, "epoch": 1.4623655913978495, "percentage": 48.85, "elapsed_time": "0:14:41", "remaining_time": "0:15:23"}
{"current_steps": 180, "total_steps": 348, "loss": 0.0384, "lr": 1.4187916371218739e-05, "epoch": 1.5483870967741935, "percentage": 51.72, "elapsed_time": "0:15:34", "remaining_time": "0:14:31"}
{"current_steps": 190, "total_steps": 348, "loss": 0.0415, "lr": 1.2840910282888211e-05, "epoch": 1.6344086021505375, "percentage": 54.6, "elapsed_time": "0:16:25", "remaining_time": "0:13:39"}
{"current_steps": 200, "total_steps": 348, "loss": 0.0419, "lr": 1.1511488166385349e-05, "epoch": 1.7204301075268817, "percentage": 57.47, "elapsed_time": "0:17:18", "remaining_time": "0:12:48"}
{"current_steps": 210, "total_steps": 348, "loss": 0.0431, "lr": 1.0210477047960303e-05, "epoch": 1.8064516129032258, "percentage": 60.34, "elapsed_time": "0:18:10", "remaining_time": "0:11:56"}
{"current_steps": 220, "total_steps": 348, "loss": 0.0389, "lr": 8.948472570152874e-06, "epoch": 1.89247311827957, "percentage": 63.22, "elapsed_time": "0:19:02", "remaining_time": "0:11:04"}
{"current_steps": 230, "total_steps": 348, "loss": 0.0422, "lr": 7.735752699185711e-06, "epoch": 1.978494623655914, "percentage": 66.09, "elapsed_time": "0:19:53", "remaining_time": "0:10:12"}
{"current_steps": 240, "total_steps": 348, "loss": 0.0337, "lr": 6.582194019564266e-06, "epoch": 2.064516129032258, "percentage": 68.97, "elapsed_time": "0:20:45", "remaining_time": "0:09:20"}
{"current_steps": 250, "total_steps": 348, "loss": 0.0354, "lr": 5.497191297593647e-06, "epoch": 2.150537634408602, "percentage": 71.84, "elapsed_time": "0:21:37", "remaining_time": "0:08:28"}
{"current_steps": 260, "total_steps": 348, "loss": 0.0375, "lr": 4.4895809688998655e-06, "epoch": 2.236559139784946, "percentage": 74.71, "elapsed_time": "0:22:31", "remaining_time": "0:07:37"}
{"current_steps": 270, "total_steps": 348, "loss": 0.0296, "lr": 3.567569173085455e-06, "epoch": 2.3225806451612905, "percentage": 77.59, "elapsed_time": "0:23:22", "remaining_time": "0:06:45"}
{"current_steps": 280, "total_steps": 348, "loss": 0.0326, "lr": 2.7386649216166233e-06, "epoch": 2.4086021505376345, "percentage": 80.46, "elapsed_time": "0:24:15", "remaining_time": "0:05:53"}
{"current_steps": 290, "total_steps": 348, "loss": 0.037, "lr": 2.0096189432334194e-06, "epoch": 2.4946236559139785, "percentage": 83.33, "elapsed_time": "0:25:06", "remaining_time": "0:05:01"}
{"current_steps": 300, "total_steps": 348, "loss": 0.0344, "lr": 1.3863687049356465e-06, "epoch": 2.5806451612903225, "percentage": 86.21, "elapsed_time": "0:25:58", "remaining_time": "0:04:09"}
{"current_steps": 310, "total_steps": 348, "loss": 0.0382, "lr": 8.7399005630238e-07, "epoch": 2.6666666666666665, "percentage": 89.08, "elapsed_time": "0:26:50", "remaining_time": "0:03:17"}
{"current_steps": 320, "total_steps": 348, "loss": 0.0332, "lr": 4.766558909615504e-07, "epoch": 2.752688172043011, "percentage": 91.95, "elapsed_time": "0:27:42", "remaining_time": "0:02:25"}
{"current_steps": 330, "total_steps": 348, "loss": 0.0369, "lr": 1.9760216187710788e-07, "epoch": 2.838709677419355, "percentage": 94.83, "elapsed_time": "0:28:34", "remaining_time": "0:01:33"}
{"current_steps": 340, "total_steps": 348, "loss": 0.0361, "lr": 3.910152723075322e-08, "epoch": 2.924731182795699, "percentage": 97.7, "elapsed_time": "0:29:26", "remaining_time": "0:00:41"}
{"current_steps": 348, "total_steps": 348, "epoch": 2.9935483870967743, "percentage": 100.0, "elapsed_time": "0:30:08", "remaining_time": "0:00:00"}