backup / Power_Time_SFT /trainer_log.jsonl
wf8888884's picture
Add files using upload-large-folder tool
dfafc69 verified
{"current_steps": 10, "total_steps": 540, "loss": 0.6923, "accuracy": 0.42500001192092896, "learning_rate": 9.259259259259259e-07, "epoch": 0.36199095022624433, "percentage": 1.85, "elapsed_time": "0:01:20", "remaining_time": "1:11:14"}
{"current_steps": 20, "total_steps": 540, "loss": 0.6943, "accuracy": 0.4000000059604645, "learning_rate": 1.8518518518518519e-06, "epoch": 0.7239819004524887, "percentage": 3.7, "elapsed_time": "0:02:36", "remaining_time": "1:07:45"}
{"current_steps": 30, "total_steps": 540, "loss": 0.6924, "accuracy": 0.5625, "learning_rate": 2.7777777777777783e-06, "epoch": 1.085972850678733, "percentage": 5.56, "elapsed_time": "0:03:52", "remaining_time": "1:05:49"}
{"current_steps": 40, "total_steps": 540, "loss": 0.6899, "accuracy": 0.550000011920929, "learning_rate": 3.7037037037037037e-06, "epoch": 1.4479638009049773, "percentage": 7.41, "elapsed_time": "0:05:07", "remaining_time": "1:04:03"}
{"current_steps": 50, "total_steps": 540, "loss": 0.6865, "accuracy": 0.625, "learning_rate": 4.62962962962963e-06, "epoch": 1.8099547511312217, "percentage": 9.26, "elapsed_time": "0:06:25", "remaining_time": "1:02:58"}
{"current_steps": 60, "total_steps": 540, "loss": 0.6775, "accuracy": 0.637499988079071, "learning_rate": 4.998119881260576e-06, "epoch": 2.171945701357466, "percentage": 11.11, "elapsed_time": "0:07:42", "remaining_time": "1:01:41"}
{"current_steps": 70, "total_steps": 540, "loss": 0.6636, "accuracy": 0.6875, "learning_rate": 4.9866405060165044e-06, "epoch": 2.5339366515837103, "percentage": 12.96, "elapsed_time": "0:09:02", "remaining_time": "1:00:45"}
{"current_steps": 80, "total_steps": 540, "loss": 0.6473, "accuracy": 0.75, "learning_rate": 4.964774158361991e-06, "epoch": 2.8959276018099547, "percentage": 14.81, "elapsed_time": "0:10:19", "remaining_time": "0:59:20"}
{"current_steps": 90, "total_steps": 540, "loss": 0.6292, "accuracy": 0.675000011920929, "learning_rate": 4.93261217644956e-06, "epoch": 3.257918552036199, "percentage": 16.67, "elapsed_time": "0:11:35", "remaining_time": "0:57:57"}
{"current_steps": 100, "total_steps": 540, "loss": 0.6015, "accuracy": 0.75, "learning_rate": 4.8902889044347e-06, "epoch": 3.6199095022624435, "percentage": 18.52, "elapsed_time": "0:12:53", "remaining_time": "0:56:45"}
{"current_steps": 110, "total_steps": 540, "loss": 0.582, "accuracy": 0.762499988079071, "learning_rate": 4.837981131305475e-06, "epoch": 3.981900452488688, "percentage": 20.37, "elapsed_time": "0:14:14", "remaining_time": "0:55:38"}
{"current_steps": 120, "total_steps": 540, "loss": 0.5537, "accuracy": 0.75, "learning_rate": 4.775907352415367e-06, "epoch": 4.343891402714932, "percentage": 22.22, "elapsed_time": "0:15:30", "remaining_time": "0:54:18"}
{"current_steps": 130, "total_steps": 540, "loss": 0.5306, "accuracy": 0.800000011920929, "learning_rate": 4.70432685680402e-06, "epoch": 4.705882352941177, "percentage": 24.07, "elapsed_time": "0:16:43", "remaining_time": "0:52:46"}
{"current_steps": 140, "total_steps": 540, "loss": 0.5028, "accuracy": 0.824999988079071, "learning_rate": 4.623538644118244e-06, "epoch": 5.067873303167421, "percentage": 25.93, "elapsed_time": "0:18:04", "remaining_time": "0:51:38"}
{"current_steps": 150, "total_steps": 540, "loss": 0.4663, "accuracy": 0.8125, "learning_rate": 4.533880175657419e-06, "epoch": 5.429864253393665, "percentage": 27.78, "elapsed_time": "0:19:23", "remaining_time": "0:50:24"}
{"current_steps": 160, "total_steps": 540, "loss": 0.4636, "accuracy": 0.875, "learning_rate": 4.435725964760331e-06, "epoch": 5.791855203619909, "percentage": 29.63, "elapsed_time": "0:20:39", "remaining_time": "0:49:04"}
{"current_steps": 170, "total_steps": 540, "loss": 0.4245, "accuracy": 0.949999988079071, "learning_rate": 4.329486012421531e-06, "epoch": 6.153846153846154, "percentage": 31.48, "elapsed_time": "0:21:56", "remaining_time": "0:47:45"}
{"current_steps": 180, "total_steps": 540, "loss": 0.449, "accuracy": 0.9125000238418579, "learning_rate": 4.215604094671835e-06, "epoch": 6.515837104072398, "percentage": 33.33, "elapsed_time": "0:23:15", "remaining_time": "0:46:30"}
{"current_steps": 190, "total_steps": 540, "loss": 0.3764, "accuracy": 0.925000011920929, "learning_rate": 4.094555908876765e-06, "epoch": 6.877828054298643, "percentage": 35.19, "elapsed_time": "0:24:28", "remaining_time": "0:45:05"}
{"current_steps": 200, "total_steps": 540, "loss": 0.3362, "accuracy": 0.949999988079071, "learning_rate": 3.966847086696045e-06, "epoch": 7.239819004524887, "percentage": 37.04, "elapsed_time": "0:25:49", "remaining_time": "0:43:54"}
{"current_steps": 210, "total_steps": 540, "loss": 0.317, "accuracy": 0.987500011920929, "learning_rate": 3.833011082004229e-06, "epoch": 7.601809954751131, "percentage": 38.89, "elapsed_time": "0:27:04", "remaining_time": "0:42:33"}
{"current_steps": 220, "total_steps": 540, "loss": 0.3338, "accuracy": 0.875, "learning_rate": 3.693606942594873e-06, "epoch": 7.963800904977376, "percentage": 40.74, "elapsed_time": "0:28:22", "remaining_time": "0:41:17"}
{"current_steps": 230, "total_steps": 540, "loss": 0.2894, "accuracy": 0.9375, "learning_rate": 3.549216974976073e-06, "epoch": 8.32579185520362, "percentage": 42.59, "elapsed_time": "0:29:36", "remaining_time": "0:39:54"}
{"current_steps": 240, "total_steps": 540, "loss": 0.2666, "accuracy": 0.949999988079071, "learning_rate": 3.400444312011776e-06, "epoch": 8.687782805429864, "percentage": 44.44, "elapsed_time": "0:30:57", "remaining_time": "0:38:41"}
{"current_steps": 250, "total_steps": 540, "loss": 0.2556, "accuracy": 0.9125000238418579, "learning_rate": 3.2479103935691047e-06, "epoch": 9.049773755656108, "percentage": 46.3, "elapsed_time": "0:32:13", "remaining_time": "0:37:22"}
{"current_steps": 260, "total_steps": 540, "loss": 0.223, "accuracy": 1.0, "learning_rate": 3.092252370695298e-06, "epoch": 9.411764705882353, "percentage": 48.15, "elapsed_time": "0:33:32", "remaining_time": "0:36:07"}
{"current_steps": 270, "total_steps": 540, "loss": 0.2108, "accuracy": 0.9624999761581421, "learning_rate": 2.9341204441673267e-06, "epoch": 9.773755656108598, "percentage": 50.0, "elapsed_time": "0:34:49", "remaining_time": "0:34:49"}
{"current_steps": 280, "total_steps": 540, "loss": 0.2067, "accuracy": 0.9624999761581421, "learning_rate": 2.7741751485313295e-06, "epoch": 10.135746606334841, "percentage": 51.85, "elapsed_time": "0:36:07", "remaining_time": "0:33:32"}
{"current_steps": 290, "total_steps": 540, "loss": 0.1791, "accuracy": 0.9750000238418579, "learning_rate": 2.6130845929767662e-06, "epoch": 10.497737556561086, "percentage": 53.7, "elapsed_time": "0:37:27", "remaining_time": "0:32:17"}
{"current_steps": 300, "total_steps": 540, "loss": 0.173, "accuracy": 0.949999988079071, "learning_rate": 2.4515216705704396e-06, "epoch": 10.85972850678733, "percentage": 55.56, "elapsed_time": "0:38:45", "remaining_time": "0:31:00"}
{"current_steps": 310, "total_steps": 540, "loss": 0.1525, "accuracy": 0.9750000238418579, "learning_rate": 2.290161247507733e-06, "epoch": 11.221719457013574, "percentage": 57.41, "elapsed_time": "0:40:04", "remaining_time": "0:29:44"}
{"current_steps": 320, "total_steps": 540, "loss": 0.1367, "accuracy": 0.987500011920929, "learning_rate": 2.129677344121879e-06, "epoch": 11.583710407239819, "percentage": 59.26, "elapsed_time": "0:41:21", "remaining_time": "0:28:25"}
{"current_steps": 330, "total_steps": 540, "loss": 0.1436, "accuracy": 0.9750000238418579, "learning_rate": 1.970740319426474e-06, "epoch": 11.945701357466064, "percentage": 61.11, "elapsed_time": "0:42:37", "remaining_time": "0:27:07"}
{"current_steps": 340, "total_steps": 540, "loss": 0.1185, "accuracy": 0.987500011920929, "learning_rate": 1.8140140709517467e-06, "epoch": 12.307692307692308, "percentage": 62.96, "elapsed_time": "0:43:54", "remaining_time": "0:25:49"}
{"current_steps": 350, "total_steps": 540, "loss": 0.111, "accuracy": 0.987500011920929, "learning_rate": 1.6601532615711452e-06, "epoch": 12.669683257918551, "percentage": 64.81, "elapsed_time": "0:45:11", "remaining_time": "0:24:32"}
{"current_steps": 360, "total_steps": 540, "loss": 0.1133, "accuracy": 0.987500011920929, "learning_rate": 1.509800584902108e-06, "epoch": 13.031674208144796, "percentage": 66.67, "elapsed_time": "0:46:29", "remaining_time": "0:23:14"}
{"current_steps": 370, "total_steps": 540, "loss": 0.0866, "accuracy": 1.0, "learning_rate": 1.3635840807037487e-06, "epoch": 13.393665158371041, "percentage": 68.52, "elapsed_time": "0:47:50", "remaining_time": "0:21:58"}
{"current_steps": 380, "total_steps": 540, "loss": 0.0953, "accuracy": 0.987500011920929, "learning_rate": 1.2221145114853172e-06, "epoch": 13.755656108597286, "percentage": 70.37, "elapsed_time": "0:49:06", "remaining_time": "0:20:40"}
{"current_steps": 390, "total_steps": 540, "loss": 0.0879, "accuracy": 0.987500011920929, "learning_rate": 1.085982811283654e-06, "epoch": 14.117647058823529, "percentage": 72.22, "elapsed_time": "0:50:20", "remaining_time": "0:19:21"}
{"current_steps": 400, "total_steps": 540, "loss": 0.0783, "accuracy": 0.987500011920929, "learning_rate": 9.557576172663577e-07, "epoch": 14.479638009049774, "percentage": 74.07, "elapsed_time": "0:51:37", "remaining_time": "0:18:04"}
{"current_steps": 410, "total_steps": 540, "loss": 0.0818, "accuracy": 1.0, "learning_rate": 8.319828944714508e-07, "epoch": 14.841628959276019, "percentage": 75.93, "elapsed_time": "0:52:54", "remaining_time": "0:16:46"}
{"current_steps": 420, "total_steps": 540, "loss": 0.08, "accuracy": 1.0, "learning_rate": 7.151756636052529e-07, "epoch": 15.203619909502262, "percentage": 77.78, "elapsed_time": "0:54:09", "remaining_time": "0:15:28"}
{"current_steps": 430, "total_steps": 540, "loss": 0.0697, "accuracy": 1.0, "learning_rate": 6.058238413897052e-07, "epoch": 15.565610859728507, "percentage": 79.63, "elapsed_time": "0:55:26", "remaining_time": "0:14:10"}
{"current_steps": 440, "total_steps": 540, "loss": 0.0643, "accuracy": 1.0, "learning_rate": 5.043842024802675e-07, "epoch": 15.927601809954751, "percentage": 81.48, "elapsed_time": "0:56:42", "remaining_time": "0:12:53"}
{"current_steps": 450, "total_steps": 540, "loss": 0.0693, "accuracy": 1.0, "learning_rate": 4.1128047146765936e-07, "epoch": 16.289592760180994, "percentage": 83.33, "elapsed_time": "0:58:03", "remaining_time": "0:11:36"}
{"current_steps": 460, "total_steps": 540, "loss": 0.0608, "accuracy": 1.0, "learning_rate": 3.269015529333805e-07, "epoch": 16.65158371040724, "percentage": 85.19, "elapsed_time": "0:59:17", "remaining_time": "0:10:18"}
{"current_steps": 470, "total_steps": 540, "loss": 0.0617, "accuracy": 1.0, "learning_rate": 2.515999069522676e-07, "epoch": 17.013574660633484, "percentage": 87.04, "elapsed_time": "1:00:38", "remaining_time": "0:09:01"}
{"current_steps": 480, "total_steps": 540, "loss": 0.0602, "accuracy": 0.987500011920929, "learning_rate": 1.8569007682777417e-07, "epoch": 17.375565610859727, "percentage": 88.89, "elapsed_time": "1:01:56", "remaining_time": "0:07:44"}
{"current_steps": 490, "total_steps": 540, "loss": 0.0585, "accuracy": 1.0, "learning_rate": 1.2944737520980883e-07, "epoch": 17.737556561085974, "percentage": 90.74, "elapsed_time": "1:03:11", "remaining_time": "0:06:26"}
{"current_steps": 500, "total_steps": 540, "loss": 0.0617, "accuracy": 1.0, "learning_rate": 8.310673408334496e-08, "epoch": 18.099547511312217, "percentage": 92.59, "elapsed_time": "1:04:33", "remaining_time": "0:05:09"}
{"current_steps": 510, "total_steps": 540, "loss": 0.0639, "accuracy": 1.0, "learning_rate": 4.6861723431538273e-08, "epoch": 18.46153846153846, "percentage": 94.44, "elapsed_time": "1:05:53", "remaining_time": "0:03:52"}
{"current_steps": 520, "total_steps": 540, "loss": 0.0534, "accuracy": 0.987500011920929, "learning_rate": 2.0863742672497244e-08, "epoch": 18.823529411764707, "percentage": 96.3, "elapsed_time": "1:07:03", "remaining_time": "0:02:34"}
{"current_steps": 530, "total_steps": 540, "loss": 0.0605, "accuracy": 0.987500011920929, "learning_rate": 5.221388247169945e-09, "epoch": 19.18552036199095, "percentage": 98.15, "elapsed_time": "1:08:19", "remaining_time": "0:01:17"}
{"current_steps": 540, "total_steps": 540, "loss": 0.0601, "accuracy": 1.0, "learning_rate": 0.0, "epoch": 19.547511312217196, "percentage": 100.0, "elapsed_time": "1:09:31", "remaining_time": "0:00:00"}
{"current_steps": 540, "total_steps": 540, "epoch": 19.547511312217196, "percentage": 100.0, "elapsed_time": "1:09:32", "remaining_time": "0:00:00"}