Mistral-EN-Finetuned / trainer_log.jsonl
SamChen888's picture
Upload folder using huggingface_hub
593f745 verified
{"current_steps": 10, "total_steps": 348, "loss": 0.2134, "lr": 2.9938918800982563e-05, "epoch": 0.08602150537634409, "percentage": 2.87, "elapsed_time": "0:01:43", "remaining_time": "0:58:21"}
{"current_steps": 20, "total_steps": 348, "loss": 0.0692, "lr": 2.975617265898004e-05, "epoch": 0.17204301075268819, "percentage": 5.75, "elapsed_time": "0:03:24", "remaining_time": "0:56:01"}
{"current_steps": 30, "total_steps": 348, "loss": 0.0594, "lr": 2.9453249887788343e-05, "epoch": 0.25806451612903225, "percentage": 8.62, "elapsed_time": "0:05:08", "remaining_time": "0:54:24"}
{"current_steps": 40, "total_steps": 348, "loss": 0.0546, "lr": 2.9032617538884018e-05, "epoch": 0.34408602150537637, "percentage": 11.49, "elapsed_time": "0:06:51", "remaining_time": "0:52:48"}
{"current_steps": 50, "total_steps": 348, "loss": 0.0511, "lr": 2.84977013093626e-05, "epoch": 0.43010752688172044, "percentage": 14.37, "elapsed_time": "0:08:33", "remaining_time": "0:50:59"}
{"current_steps": 60, "total_steps": 348, "loss": 0.0516, "lr": 2.7852857642513838e-05, "epoch": 0.5161290322580645, "percentage": 17.24, "elapsed_time": "0:10:15", "remaining_time": "0:49:12"}
{"current_steps": 70, "total_steps": 348, "loss": 0.0464, "lr": 2.7103338248251055e-05, "epoch": 0.6021505376344086, "percentage": 20.11, "elapsed_time": "0:11:57", "remaining_time": "0:47:31"}
{"current_steps": 80, "total_steps": 348, "loss": 0.045, "lr": 2.6255247332346036e-05, "epoch": 0.6881720430107527, "percentage": 22.99, "elapsed_time": "0:13:40", "remaining_time": "0:45:49"}
{"current_steps": 90, "total_steps": 348, "loss": 0.0478, "lr": 2.531549188280135e-05, "epoch": 0.7741935483870968, "percentage": 25.86, "elapsed_time": "0:15:23", "remaining_time": "0:44:08"}
{"current_steps": 100, "total_steps": 348, "loss": 0.0397, "lr": 2.4291725418235848e-05, "epoch": 0.8602150537634409, "percentage": 28.74, "elapsed_time": "0:17:06", "remaining_time": "0:42:24"}
{"current_steps": 110, "total_steps": 348, "loss": 0.0362, "lr": 2.3192285656405456e-05, "epoch": 0.946236559139785, "percentage": 31.61, "elapsed_time": "0:18:47", "remaining_time": "0:40:39"}
{"current_steps": 120, "total_steps": 348, "loss": 0.0428, "lr": 2.2026126610496852e-05, "epoch": 1.032258064516129, "percentage": 34.48, "elapsed_time": "0:20:27", "remaining_time": "0:38:52"}
{"current_steps": 130, "total_steps": 348, "loss": 0.0334, "lr": 2.0802745666212592e-05, "epoch": 1.118279569892473, "percentage": 37.36, "elapsed_time": "0:22:11", "remaining_time": "0:37:13"}
{"current_steps": 140, "total_steps": 348, "loss": 0.035, "lr": 1.953210623354359e-05, "epoch": 1.2043010752688172, "percentage": 40.23, "elapsed_time": "0:23:54", "remaining_time": "0:35:30"}
{"current_steps": 150, "total_steps": 348, "loss": 0.0352, "lr": 1.8224556603165363e-05, "epoch": 1.2903225806451613, "percentage": 43.1, "elapsed_time": "0:25:34", "remaining_time": "0:33:45"}
{"current_steps": 160, "total_steps": 348, "loss": 0.0364, "lr": 1.689074566830434e-05, "epoch": 1.3763440860215055, "percentage": 45.98, "elapsed_time": "0:27:16", "remaining_time": "0:32:02"}
{"current_steps": 170, "total_steps": 348, "loss": 0.0332, "lr": 1.5541536198449044e-05, "epoch": 1.4623655913978495, "percentage": 48.85, "elapsed_time": "0:28:59", "remaining_time": "0:30:20"}
{"current_steps": 180, "total_steps": 348, "loss": 0.0315, "lr": 1.4187916371218739e-05, "epoch": 1.5483870967741935, "percentage": 51.72, "elapsed_time": "0:30:41", "remaining_time": "0:28:38"}
{"current_steps": 190, "total_steps": 348, "loss": 0.0312, "lr": 1.2840910282888211e-05, "epoch": 1.6344086021505375, "percentage": 54.6, "elapsed_time": "0:32:22", "remaining_time": "0:26:55"}
{"current_steps": 200, "total_steps": 348, "loss": 0.0324, "lr": 1.1511488166385349e-05, "epoch": 1.7204301075268817, "percentage": 57.47, "elapsed_time": "0:34:04", "remaining_time": "0:25:13"}
{"current_steps": 210, "total_steps": 348, "loss": 0.0326, "lr": 1.0210477047960303e-05, "epoch": 1.8064516129032258, "percentage": 60.34, "elapsed_time": "0:35:48", "remaining_time": "0:23:31"}
{"current_steps": 220, "total_steps": 348, "loss": 0.0319, "lr": 8.948472570152874e-06, "epoch": 1.89247311827957, "percentage": 63.22, "elapsed_time": "0:37:30", "remaining_time": "0:21:49"}
{"current_steps": 230, "total_steps": 348, "loss": 0.0319, "lr": 7.735752699185711e-06, "epoch": 1.978494623655914, "percentage": 66.09, "elapsed_time": "0:39:11", "remaining_time": "0:20:06"}
{"current_steps": 240, "total_steps": 348, "loss": 0.0247, "lr": 6.582194019564266e-06, "epoch": 2.064516129032258, "percentage": 68.97, "elapsed_time": "0:40:52", "remaining_time": "0:18:23"}
{"current_steps": 250, "total_steps": 348, "loss": 0.0276, "lr": 5.497191297593647e-06, "epoch": 2.150537634408602, "percentage": 71.84, "elapsed_time": "0:42:35", "remaining_time": "0:16:41"}
{"current_steps": 260, "total_steps": 348, "loss": 0.0259, "lr": 4.4895809688998655e-06, "epoch": 2.236559139784946, "percentage": 74.71, "elapsed_time": "0:44:20", "remaining_time": "0:15:00"}
{"current_steps": 270, "total_steps": 348, "loss": 0.0213, "lr": 3.567569173085455e-06, "epoch": 2.3225806451612905, "percentage": 77.59, "elapsed_time": "0:46:01", "remaining_time": "0:13:17"}
{"current_steps": 280, "total_steps": 348, "loss": 0.0224, "lr": 2.7386649216166233e-06, "epoch": 2.4086021505376345, "percentage": 80.46, "elapsed_time": "0:47:46", "remaining_time": "0:11:36"}
{"current_steps": 290, "total_steps": 348, "loss": 0.0253, "lr": 2.0096189432334194e-06, "epoch": 2.4946236559139785, "percentage": 83.33, "elapsed_time": "0:49:27", "remaining_time": "0:09:53"}
{"current_steps": 300, "total_steps": 348, "loss": 0.0241, "lr": 1.3863687049356465e-06, "epoch": 2.5806451612903225, "percentage": 86.21, "elapsed_time": "0:51:10", "remaining_time": "0:08:11"}
{"current_steps": 310, "total_steps": 348, "loss": 0.0268, "lr": 8.7399005630238e-07, "epoch": 2.6666666666666665, "percentage": 89.08, "elapsed_time": "0:52:52", "remaining_time": "0:06:28"}
{"current_steps": 320, "total_steps": 348, "loss": 0.0222, "lr": 4.766558909615504e-07, "epoch": 2.752688172043011, "percentage": 91.95, "elapsed_time": "0:54:33", "remaining_time": "0:04:46"}
{"current_steps": 330, "total_steps": 348, "loss": 0.0265, "lr": 1.9760216187710788e-07, "epoch": 2.838709677419355, "percentage": 94.83, "elapsed_time": "0:56:15", "remaining_time": "0:03:04"}
{"current_steps": 340, "total_steps": 348, "loss": 0.0242, "lr": 3.910152723075322e-08, "epoch": 2.924731182795699, "percentage": 97.7, "elapsed_time": "0:57:57", "remaining_time": "0:01:21"}
{"current_steps": 348, "total_steps": 348, "epoch": 2.9935483870967743, "percentage": 100.0, "elapsed_time": "0:59:20", "remaining_time": "0:00:00"}