backup / Area_SFT /trainer_log.jsonl
wf8888884's picture
Add files using upload-large-folder tool
db6ca4b verified
{"current_steps": 110, "total_steps": 580, "loss": 0.5908, "accuracy": 0.8374999761581421, "learning_rate": 4.878569458453592e-06, "epoch": 3.7698744769874475, "percentage": 18.97, "elapsed_time": "0:01:18", "remaining_time": "0:05:35"}
{"current_steps": 120, "total_steps": 580, "loss": 0.5783, "accuracy": 0.8999999761581421, "learning_rate": 4.827968782785062e-06, "epoch": 4.104602510460251, "percentage": 20.69, "elapsed_time": "0:02:30", "remaining_time": "0:09:38"}
{"current_steps": 130, "total_steps": 580, "loss": 0.5338, "accuracy": 0.8999999761581421, "learning_rate": 4.7689385491773934e-06, "epoch": 4.439330543933054, "percentage": 22.41, "elapsed_time": "0:03:46", "remaining_time": "0:13:04"}
{"current_steps": 140, "total_steps": 580, "loss": 0.5215, "accuracy": 0.824999988079071, "learning_rate": 4.70169250567482e-06, "epoch": 4.7740585774058575, "percentage": 24.14, "elapsed_time": "0:04:58", "remaining_time": "0:15:38"}
{"current_steps": 150, "total_steps": 580, "loss": 0.5019, "accuracy": 0.8500000238418579, "learning_rate": 4.626474149709127e-06, "epoch": 5.108786610878661, "percentage": 25.86, "elapsed_time": "0:06:19", "remaining_time": "0:18:07"}
{"current_steps": 160, "total_steps": 580, "loss": 0.4586, "accuracy": 0.824999988079071, "learning_rate": 4.54355584639723e-06, "epoch": 5.443514644351464, "percentage": 27.59, "elapsed_time": "0:07:35", "remaining_time": "0:19:55"}
{"current_steps": 170, "total_steps": 580, "loss": 0.4442, "accuracy": 0.887499988079071, "learning_rate": 4.45323784230908e-06, "epoch": 5.7782426778242675, "percentage": 29.31, "elapsed_time": "0:08:56", "remaining_time": "0:21:33"}
{"current_steps": 180, "total_steps": 580, "loss": 0.4355, "accuracy": 0.8999999761581421, "learning_rate": 4.355847178277025e-06, "epoch": 6.112970711297071, "percentage": 31.03, "elapsed_time": "0:10:11", "remaining_time": "0:22:39"}
{"current_steps": 190, "total_steps": 580, "loss": 0.3719, "accuracy": 0.925000011920929, "learning_rate": 4.2517365051833564e-06, "epoch": 6.447698744769874, "percentage": 32.76, "elapsed_time": "0:11:29", "remaining_time": "0:23:34"}
{"current_steps": 200, "total_steps": 580, "loss": 0.3829, "accuracy": 0.9375, "learning_rate": 4.141282807014034e-06, "epoch": 6.7824267782426775, "percentage": 34.48, "elapsed_time": "0:12:44", "remaining_time": "0:24:12"}
{"current_steps": 210, "total_steps": 580, "loss": 0.3522, "accuracy": 0.925000011920929, "learning_rate": 4.024886035802432e-06, "epoch": 7.117154811715481, "percentage": 36.21, "elapsed_time": "0:14:06", "remaining_time": "0:24:50"}
{"current_steps": 220, "total_steps": 580, "loss": 0.3219, "accuracy": 0.8999999761581421, "learning_rate": 3.9029676634059565e-06, "epoch": 7.451882845188284, "percentage": 37.93, "elapsed_time": "0:15:21", "remaining_time": "0:25:08"}
{"current_steps": 230, "total_steps": 580, "loss": 0.3041, "accuracy": 0.9125000238418579, "learning_rate": 3.7759691553595214e-06, "epoch": 7.786610878661088, "percentage": 39.66, "elapsed_time": "0:16:46", "remaining_time": "0:25:31"}
{"current_steps": 240, "total_steps": 580, "loss": 0.3065, "accuracy": 0.9125000238418579, "learning_rate": 3.6443503723320837e-06, "epoch": 8.121338912133892, "percentage": 41.38, "elapsed_time": "0:18:01", "remaining_time": "0:25:31"}
{"current_steps": 250, "total_steps": 580, "loss": 0.2498, "accuracy": 0.9750000238418579, "learning_rate": 3.508587904974522e-06, "epoch": 8.456066945606695, "percentage": 43.1, "elapsed_time": "0:19:23", "remaining_time": "0:25:35"}
{"current_steps": 260, "total_steps": 580, "loss": 0.2532, "accuracy": 0.925000011920929, "learning_rate": 3.3691733481883693e-06, "epoch": 8.790794979079498, "percentage": 44.83, "elapsed_time": "0:20:41", "remaining_time": "0:25:28"}
{"current_steps": 270, "total_steps": 580, "loss": 0.2314, "accuracy": 0.9750000238418579, "learning_rate": 3.226611521064278e-06, "epoch": 9.125523012552302, "percentage": 46.55, "elapsed_time": "0:21:51", "remaining_time": "0:25:06"}
{"current_steps": 280, "total_steps": 580, "loss": 0.2142, "accuracy": 0.9624999761581421, "learning_rate": 3.0814186389357765e-06, "epoch": 9.460251046025105, "percentage": 48.28, "elapsed_time": "0:23:10", "remaining_time": "0:24:49"}
{"current_steps": 290, "total_steps": 580, "loss": 0.1881, "accuracy": 1.0, "learning_rate": 2.9341204441673267e-06, "epoch": 9.794979079497908, "percentage": 50.0, "elapsed_time": "0:24:25", "remaining_time": "0:24:25"}
{"current_steps": 300, "total_steps": 580, "loss": 0.1798, "accuracy": 0.9624999761581421, "learning_rate": 2.785250302445062e-06, "epoch": 10.129707112970712, "percentage": 51.72, "elapsed_time": "0:25:46", "remaining_time": "0:24:02"}
{"current_steps": 310, "total_steps": 580, "loss": 0.1558, "accuracy": 0.987500011920929, "learning_rate": 2.6353472714635443e-06, "epoch": 10.464435146443515, "percentage": 53.45, "elapsed_time": "0:27:07", "remaining_time": "0:23:37"}
{"current_steps": 320, "total_steps": 580, "loss": 0.1538, "accuracy": 0.9750000238418579, "learning_rate": 2.4849541490017868e-06, "epoch": 10.799163179916318, "percentage": 55.17, "elapsed_time": "0:28:28", "remaining_time": "0:23:08"}
{"current_steps": 330, "total_steps": 580, "loss": 0.1373, "accuracy": 0.9750000238418579, "learning_rate": 2.3346155074564712e-06, "epoch": 11.133891213389122, "percentage": 56.9, "elapsed_time": "0:29:46", "remaining_time": "0:22:33"}
{"current_steps": 340, "total_steps": 580, "loss": 0.1257, "accuracy": 0.9624999761581421, "learning_rate": 2.184875721949277e-06, "epoch": 11.468619246861925, "percentage": 58.62, "elapsed_time": "0:31:01", "remaining_time": "0:21:54"}
{"current_steps": 350, "total_steps": 580, "loss": 0.1184, "accuracy": 0.987500011920929, "learning_rate": 2.0362769991485514e-06, "epoch": 11.803347280334728, "percentage": 60.34, "elapsed_time": "0:32:21", "remaining_time": "0:21:16"}
{"current_steps": 360, "total_steps": 580, "loss": 0.1106, "accuracy": 0.987500011920929, "learning_rate": 1.8893574139429226e-06, "epoch": 12.138075313807532, "percentage": 62.07, "elapsed_time": "0:33:37", "remaining_time": "0:20:33"}
{"current_steps": 370, "total_steps": 580, "loss": 0.0907, "accuracy": 0.9750000238418579, "learning_rate": 1.744648961076068e-06, "epoch": 12.472803347280335, "percentage": 63.79, "elapsed_time": "0:34:56", "remaining_time": "0:19:50"}
{"current_steps": 380, "total_steps": 580, "loss": 0.0923, "accuracy": 1.0, "learning_rate": 1.602675628797636e-06, "epoch": 12.807531380753138, "percentage": 65.52, "elapsed_time": "0:36:17", "remaining_time": "0:19:06"}
{"current_steps": 390, "total_steps": 580, "loss": 0.0876, "accuracy": 0.9624999761581421, "learning_rate": 1.4639515015056205e-06, "epoch": 13.142259414225942, "percentage": 67.24, "elapsed_time": "0:37:36", "remaining_time": "0:18:19"}
{"current_steps": 400, "total_steps": 580, "loss": 0.0662, "accuracy": 1.0, "learning_rate": 1.328978898250525e-06, "epoch": 13.476987447698745, "percentage": 68.97, "elapsed_time": "0:38:56", "remaining_time": "0:17:31"}
{"current_steps": 410, "total_steps": 580, "loss": 0.0808, "accuracy": 0.987500011920929, "learning_rate": 1.198246553841744e-06, "epoch": 13.811715481171548, "percentage": 70.69, "elapsed_time": "0:40:12", "remaining_time": "0:16:40"}
{"current_steps": 420, "total_steps": 580, "loss": 0.0651, "accuracy": 1.0, "learning_rate": 1.0722278491423998e-06, "epoch": 14.146443514644352, "percentage": 72.41, "elapsed_time": "0:41:32", "remaining_time": "0:15:49"}
{"current_steps": 430, "total_steps": 580, "loss": 0.0609, "accuracy": 1.0, "learning_rate": 9.513790969606926e-07, "epoch": 14.481171548117155, "percentage": 74.14, "elapsed_time": "0:42:48", "remaining_time": "0:14:55"}
{"current_steps": 440, "total_steps": 580, "loss": 0.0624, "accuracy": 1.0, "learning_rate": 8.361378897445643e-07, "epoch": 14.815899581589958, "percentage": 75.86, "elapsed_time": "0:44:05", "remaining_time": "0:14:01"}
{"current_steps": 450, "total_steps": 580, "loss": 0.0513, "accuracy": 1.0, "learning_rate": 7.269215150626391e-07, "epoch": 15.150627615062762, "percentage": 77.59, "elapsed_time": "0:45:17", "remaining_time": "0:13:05"}
{"current_steps": 460, "total_steps": 580, "loss": 0.0588, "accuracy": 0.987500011920929, "learning_rate": 6.241254446089942e-07, "epoch": 15.485355648535565, "percentage": 79.31, "elapsed_time": "0:46:31", "remaining_time": "0:12:08"}
{"current_steps": 470, "total_steps": 580, "loss": 0.0484, "accuracy": 1.0, "learning_rate": 5.281219022030423e-07, "epoch": 15.820083682008368, "percentage": 81.03, "elapsed_time": "0:47:50", "remaining_time": "0:11:11"}
{"current_steps": 480, "total_steps": 580, "loss": 0.0443, "accuracy": 1.0, "learning_rate": 4.392585159698087e-07, "epoch": 16.15481171548117, "percentage": 82.76, "elapsed_time": "0:49:06", "remaining_time": "0:10:13"}
{"current_steps": 490, "total_steps": 580, "loss": 0.0483, "accuracy": 1.0, "learning_rate": 3.578570595810274e-07, "epoch": 16.489539748953973, "percentage": 84.48, "elapsed_time": "0:50:20", "remaining_time": "0:09:14"}
{"current_steps": 500, "total_steps": 580, "loss": 0.0468, "accuracy": 1.0, "learning_rate": 2.8421228711503127e-07, "epoch": 16.824267782426777, "percentage": 86.21, "elapsed_time": "0:51:36", "remaining_time": "0:08:15"}
{"current_steps": 510, "total_steps": 580, "loss": 0.0398, "accuracy": 1.0, "learning_rate": 2.1859086575439225e-07, "epoch": 17.15899581589958, "percentage": 87.93, "elapsed_time": "0:52:54", "remaining_time": "0:07:15"}
{"current_steps": 520, "total_steps": 580, "loss": 0.0436, "accuracy": 1.0, "learning_rate": 1.6123041018599766e-07, "epoch": 17.493723849372383, "percentage": 89.66, "elapsed_time": "0:54:14", "remaining_time": "0:06:15"}
{"current_steps": 530, "total_steps": 580, "loss": 0.0477, "accuracy": 1.0, "learning_rate": 1.1233862220001168e-07, "epoch": 17.828451882845187, "percentage": 91.38, "elapsed_time": "0:55:34", "remaining_time": "0:05:14"}
{"current_steps": 540, "total_steps": 580, "loss": 0.0408, "accuracy": 1.0, "learning_rate": 7.209253860320897e-08, "epoch": 18.16317991631799, "percentage": 93.1, "elapsed_time": "0:56:54", "remaining_time": "0:04:12"}
{"current_steps": 550, "total_steps": 580, "loss": 0.0423, "accuracy": 1.0, "learning_rate": 4.063789016999331e-08, "epoch": 18.497907949790793, "percentage": 94.83, "elapsed_time": "0:58:10", "remaining_time": "0:03:10"}
{"current_steps": 560, "total_steps": 580, "loss": 0.04, "accuracy": 1.0, "learning_rate": 1.808857395232788e-08, "epoch": 18.8326359832636, "percentage": 96.55, "elapsed_time": "0:59:27", "remaining_time": "0:02:07"}
{"current_steps": 570, "total_steps": 580, "loss": 0.041, "accuracy": 1.0, "learning_rate": 4.526240859345499e-09, "epoch": 19.1673640167364, "percentage": 98.28, "elapsed_time": "1:00:47", "remaining_time": "0:01:03"}
{"current_steps": 580, "total_steps": 580, "loss": 0.0408, "accuracy": 0.987500011920929, "learning_rate": 0.0, "epoch": 19.502092050209207, "percentage": 100.0, "elapsed_time": "1:02:03", "remaining_time": "0:00:00"}
{"current_steps": 580, "total_steps": 580, "epoch": 19.502092050209207, "percentage": 100.0, "elapsed_time": "1:02:04", "remaining_time": "0:00:00"}