Qwen2.5-7B-Multi-Question / trainer_log.jsonl
PumeTu's picture
Upload folder using huggingface_hub
e5290dd verified
{"current_steps": 10, "total_steps": 420, "loss": 0.6621, "lr": 4.761904761904762e-06, "epoch": 0.07126948775055679, "percentage": 2.38, "elapsed_time": "0:04:19", "remaining_time": "2:57:28"}
{"current_steps": 20, "total_steps": 420, "loss": 0.2856, "lr": 9.523809523809525e-06, "epoch": 0.14253897550111358, "percentage": 4.76, "elapsed_time": "0:08:24", "remaining_time": "2:48:06"}
{"current_steps": 30, "total_steps": 420, "loss": 0.2252, "lr": 1.4285714285714287e-05, "epoch": 0.21380846325167038, "percentage": 7.14, "elapsed_time": "0:12:39", "remaining_time": "2:44:30"}
{"current_steps": 40, "total_steps": 420, "loss": 0.1807, "lr": 1.904761904761905e-05, "epoch": 0.28507795100222716, "percentage": 9.52, "elapsed_time": "0:16:44", "remaining_time": "2:38:59"}
{"current_steps": 50, "total_steps": 420, "loss": 0.1351, "lr": 1.997790438338385e-05, "epoch": 0.35634743875278396, "percentage": 11.9, "elapsed_time": "0:20:47", "remaining_time": "2:33:49"}
{"current_steps": 60, "total_steps": 420, "loss": 0.0998, "lr": 1.9888308262251286e-05, "epoch": 0.42761692650334077, "percentage": 14.29, "elapsed_time": "0:25:04", "remaining_time": "2:30:28"}
{"current_steps": 70, "total_steps": 420, "loss": 0.0748, "lr": 1.973044870579824e-05, "epoch": 0.49888641425389757, "percentage": 16.67, "elapsed_time": "0:29:14", "remaining_time": "2:26:12"}
{"current_steps": 80, "total_steps": 420, "loss": 0.0531, "lr": 1.9505415489478293e-05, "epoch": 0.5701559020044543, "percentage": 19.05, "elapsed_time": "0:33:26", "remaining_time": "2:22:09"}
{"current_steps": 90, "total_steps": 420, "loss": 0.0393, "lr": 1.921476211870408e-05, "epoch": 0.6414253897550112, "percentage": 21.43, "elapsed_time": "0:37:34", "remaining_time": "2:17:46"}
{"current_steps": 100, "total_steps": 420, "loss": 0.0312, "lr": 1.8860495104301346e-05, "epoch": 0.7126948775055679, "percentage": 23.81, "elapsed_time": "0:41:58", "remaining_time": "2:14:17"}
{"current_steps": 110, "total_steps": 420, "loss": 0.0242, "lr": 1.844506011066308e-05, "epoch": 0.7839643652561247, "percentage": 26.19, "elapsed_time": "0:45:51", "remaining_time": "2:09:14"}
{"current_steps": 120, "total_steps": 420, "loss": 0.0204, "lr": 1.7971325072229227e-05, "epoch": 0.8552338530066815, "percentage": 28.57, "elapsed_time": "0:50:09", "remaining_time": "2:05:22"}
{"current_steps": 130, "total_steps": 420, "loss": 0.0177, "lr": 1.7442560394846518e-05, "epoch": 0.9265033407572383, "percentage": 30.95, "elapsed_time": "0:54:16", "remaining_time": "2:01:05"}
{"current_steps": 140, "total_steps": 420, "loss": 0.0148, "lr": 1.686241637868734e-05, "epoch": 0.9977728285077951, "percentage": 33.33, "elapsed_time": "0:58:30", "remaining_time": "1:57:01"}
{"current_steps": 150, "total_steps": 420, "loss": 0.0081, "lr": 1.6234898018587336e-05, "epoch": 1.064142538975501, "percentage": 35.71, "elapsed_time": "1:02:27", "remaining_time": "1:52:24"}
{"current_steps": 160, "total_steps": 420, "loss": 0.0069, "lr": 1.5564337355766412e-05, "epoch": 1.135412026726058, "percentage": 38.1, "elapsed_time": "1:06:42", "remaining_time": "1:48:24"}
{"current_steps": 170, "total_steps": 420, "loss": 0.0061, "lr": 1.4855363571801523e-05, "epoch": 1.2066815144766148, "percentage": 40.48, "elapsed_time": "1:10:43", "remaining_time": "1:44:00"}
{"current_steps": 180, "total_steps": 420, "loss": 0.0052, "lr": 1.4112871031306118e-05, "epoch": 1.2779510022271716, "percentage": 42.86, "elapsed_time": "1:14:48", "remaining_time": "1:39:44"}
{"current_steps": 190, "total_steps": 420, "loss": 0.0053, "lr": 1.3341985493931877e-05, "epoch": 1.3492204899777283, "percentage": 45.24, "elapsed_time": "1:18:48", "remaining_time": "1:35:24"}
{"current_steps": 200, "total_steps": 420, "loss": 0.0048, "lr": 1.2548028728946548e-05, "epoch": 1.4204899777282851, "percentage": 47.62, "elapsed_time": "1:22:58", "remaining_time": "1:31:16"}
{"current_steps": 210, "total_steps": 420, "loss": 0.0045, "lr": 1.1736481776669307e-05, "epoch": 1.4917594654788418, "percentage": 50.0, "elapsed_time": "1:27:03", "remaining_time": "1:27:03"}
{"current_steps": 220, "total_steps": 420, "loss": 0.0038, "lr": 1.0912947110386484e-05, "epoch": 1.5630289532293986, "percentage": 52.38, "elapsed_time": "1:30:57", "remaining_time": "1:22:41"}
{"current_steps": 230, "total_steps": 420, "loss": 0.0041, "lr": 1.0083109959960974e-05, "epoch": 1.6342984409799555, "percentage": 54.76, "elapsed_time": "1:35:41", "remaining_time": "1:19:03"}
{"current_steps": 240, "total_steps": 420, "loss": 0.004, "lr": 9.252699064135759e-06, "epoch": 1.7055679287305123, "percentage": 57.14, "elapsed_time": "1:39:50", "remaining_time": "1:14:52"}
{"current_steps": 250, "total_steps": 420, "loss": 0.0038, "lr": 8.427447122476148e-06, "epoch": 1.7768374164810692, "percentage": 59.52, "elapsed_time": "1:44:01", "remaining_time": "1:10:44"}
{"current_steps": 260, "total_steps": 420, "loss": 0.0039, "lr": 7.613051219968624e-06, "epoch": 1.8481069042316258, "percentage": 61.9, "elapsed_time": "1:49:16", "remaining_time": "1:07:14"}
{"current_steps": 270, "total_steps": 420, "loss": 0.0035, "lr": 6.815133497483157e-06, "epoch": 1.9193763919821827, "percentage": 64.29, "elapsed_time": "1:53:36", "remaining_time": "1:03:07"}
{"current_steps": 280, "total_steps": 420, "loss": 0.003, "lr": 6.039202339608432e-06, "epoch": 1.9906458797327393, "percentage": 66.67, "elapsed_time": "1:57:40", "remaining_time": "0:58:50"}
{"current_steps": 290, "total_steps": 420, "loss": 0.0019, "lr": 5.290614347797802e-06, "epoch": 2.057015590200445, "percentage": 69.05, "elapsed_time": "2:01:52", "remaining_time": "0:54:38"}
{"current_steps": 300, "total_steps": 420, "loss": 0.0015, "lr": 4.5745373613424075e-06, "epoch": 2.128285077951002, "percentage": 71.43, "elapsed_time": "2:06:12", "remaining_time": "0:50:28"}
{"current_steps": 310, "total_steps": 420, "loss": 0.0015, "lr": 3.89591478145437e-06, "epoch": 2.199554565701559, "percentage": 73.81, "elapsed_time": "2:10:24", "remaining_time": "0:46:16"}
{"current_steps": 320, "total_steps": 420, "loss": 0.0015, "lr": 3.2594314447468457e-06, "epoch": 2.270824053452116, "percentage": 76.19, "elapsed_time": "2:14:30", "remaining_time": "0:42:02"}
{"current_steps": 330, "total_steps": 420, "loss": 0.0014, "lr": 2.669481281701739e-06, "epoch": 2.3420935412026727, "percentage": 78.57, "elapsed_time": "2:18:47", "remaining_time": "0:37:51"}
{"current_steps": 340, "total_steps": 420, "loss": 0.0013, "lr": 2.130136983393112e-06, "epoch": 2.4133630289532295, "percentage": 80.95, "elapsed_time": "2:22:53", "remaining_time": "0:33:37"}
{"current_steps": 350, "total_steps": 420, "loss": 0.0013, "lr": 1.6451218858706374e-06, "epoch": 2.4846325167037864, "percentage": 83.33, "elapsed_time": "2:26:54", "remaining_time": "0:29:22"}
{"current_steps": 360, "total_steps": 420, "loss": 0.0014, "lr": 1.2177842662977136e-06, "epoch": 2.5559020044543432, "percentage": 85.71, "elapsed_time": "2:30:50", "remaining_time": "0:25:08"}
{"current_steps": 370, "total_steps": 420, "loss": 0.0011, "lr": 8.510742282896545e-07, "epoch": 2.6271714922048996, "percentage": 88.1, "elapsed_time": "2:34:48", "remaining_time": "0:20:55"}
{"current_steps": 380, "total_steps": 420, "loss": 0.0012, "lr": 5.475233360227516e-07, "epoch": 2.6984409799554565, "percentage": 90.48, "elapsed_time": "2:38:55", "remaining_time": "0:16:43"}
{"current_steps": 390, "total_steps": 420, "loss": 0.0012, "lr": 3.0922713770922155e-07, "epoch": 2.7697104677060134, "percentage": 92.86, "elapsed_time": "2:43:09", "remaining_time": "0:12:33"}
{"current_steps": 400, "total_steps": 420, "loss": 0.0013, "lr": 1.3783069908621772e-07, "epoch": 2.8409799554565702, "percentage": 95.24, "elapsed_time": "2:47:15", "remaining_time": "0:08:21"}
{"current_steps": 410, "total_steps": 420, "loss": 0.0014, "lr": 3.451724678784518e-08, "epoch": 2.912249443207127, "percentage": 97.62, "elapsed_time": "2:51:27", "remaining_time": "0:04:10"}
{"current_steps": 420, "total_steps": 420, "loss": 0.001, "lr": 0.0, "epoch": 2.9835189309576835, "percentage": 100.0, "elapsed_time": "2:55:42", "remaining_time": "0:00:00"}
{"current_steps": 420, "total_steps": 420, "epoch": 2.9835189309576835, "percentage": 100.0, "elapsed_time": "2:56:45", "remaining_time": "0:00:00"}