llama3_lora / trainer_log.jsonl
fzkun's picture
Upload folder using huggingface_hub
2b770f0 verified
{"current_steps": 5, "total_steps": 258, "loss": 1.5305, "lr": 9.615384615384616e-06, "epoch": 0.057803468208092484, "percentage": 1.94, "elapsed_time": "0:00:48", "remaining_time": "0:40:49"}
{"current_steps": 10, "total_steps": 258, "loss": 1.3586, "lr": 1.923076923076923e-05, "epoch": 0.11560693641618497, "percentage": 3.88, "elapsed_time": "0:01:37", "remaining_time": "0:40:19"}
{"current_steps": 15, "total_steps": 258, "loss": 1.3282, "lr": 2.8846153846153845e-05, "epoch": 0.17341040462427745, "percentage": 5.81, "elapsed_time": "0:02:28", "remaining_time": "0:40:04"}
{"current_steps": 20, "total_steps": 258, "loss": 1.246, "lr": 3.846153846153846e-05, "epoch": 0.23121387283236994, "percentage": 7.75, "elapsed_time": "0:03:18", "remaining_time": "0:39:22"}
{"current_steps": 25, "total_steps": 258, "loss": 1.3034, "lr": 4.8076923076923084e-05, "epoch": 0.28901734104046245, "percentage": 9.69, "elapsed_time": "0:04:10", "remaining_time": "0:38:51"}
{"current_steps": 30, "total_steps": 258, "loss": 1.1816, "lr": 4.996333534627809e-05, "epoch": 0.3468208092485549, "percentage": 11.63, "elapsed_time": "0:05:02", "remaining_time": "0:38:21"}
{"current_steps": 35, "total_steps": 258, "loss": 1.2341, "lr": 4.981456948708014e-05, "epoch": 0.4046242774566474, "percentage": 13.57, "elapsed_time": "0:05:48", "remaining_time": "0:36:58"}
{"current_steps": 40, "total_steps": 258, "loss": 1.2838, "lr": 4.95520920685539e-05, "epoch": 0.4624277456647399, "percentage": 15.5, "elapsed_time": "0:06:39", "remaining_time": "0:36:17"}
{"current_steps": 45, "total_steps": 258, "loss": 1.2135, "lr": 4.9177105880720173e-05, "epoch": 0.5202312138728323, "percentage": 17.44, "elapsed_time": "0:07:28", "remaining_time": "0:35:24"}
{"current_steps": 50, "total_steps": 258, "loss": 1.11, "lr": 4.869132927957007e-05, "epoch": 0.5780346820809249, "percentage": 19.38, "elapsed_time": "0:08:23", "remaining_time": "0:34:52"}
{"current_steps": 55, "total_steps": 258, "loss": 1.2103, "lr": 4.8096988312782174e-05, "epoch": 0.6358381502890174, "percentage": 21.32, "elapsed_time": "0:09:17", "remaining_time": "0:34:17"}
{"current_steps": 60, "total_steps": 258, "loss": 1.2226, "lr": 4.73968065189672e-05, "epoch": 0.6936416184971098, "percentage": 23.26, "elapsed_time": "0:10:05", "remaining_time": "0:33:17"}
{"current_steps": 65, "total_steps": 258, "loss": 1.1403, "lr": 4.6593992447184586e-05, "epoch": 0.7514450867052023, "percentage": 25.19, "elapsed_time": "0:10:58", "remaining_time": "0:32:35"}
{"current_steps": 70, "total_steps": 258, "loss": 1.1933, "lr": 4.5692224953922266e-05, "epoch": 0.8092485549132948, "percentage": 27.13, "elapsed_time": "0:11:50", "remaining_time": "0:31:49"}
{"current_steps": 75, "total_steps": 258, "loss": 1.1941, "lr": 4.469563634491554e-05, "epoch": 0.8670520231213873, "percentage": 29.07, "elapsed_time": "0:12:37", "remaining_time": "0:30:47"}
{"current_steps": 80, "total_steps": 258, "loss": 1.3349, "lr": 4.360879343905676e-05, "epoch": 0.9248554913294798, "percentage": 31.01, "elapsed_time": "0:13:20", "remaining_time": "0:29:42"}
{"current_steps": 85, "total_steps": 258, "loss": 1.3004, "lr": 4.243667664116956e-05, "epoch": 0.9826589595375722, "percentage": 32.95, "elapsed_time": "0:14:04", "remaining_time": "0:28:39"}
{"current_steps": 90, "total_steps": 258, "loss": 1.0116, "lr": 4.118465711954569e-05, "epoch": 1.0346820809248556, "percentage": 34.88, "elapsed_time": "0:14:46", "remaining_time": "0:27:35"}
{"current_steps": 95, "total_steps": 258, "loss": 0.8764, "lr": 3.985847219282725e-05, "epoch": 1.092485549132948, "percentage": 36.82, "elapsed_time": "0:15:34", "remaining_time": "0:26:43"}
{"current_steps": 100, "total_steps": 258, "loss": 0.9051, "lr": 3.8464199039022605e-05, "epoch": 1.1502890173410405, "percentage": 38.76, "elapsed_time": "0:16:27", "remaining_time": "0:25:59"}
{"current_steps": 105, "total_steps": 258, "loss": 0.9408, "lr": 3.700822684713349e-05, "epoch": 1.208092485549133, "percentage": 40.7, "elapsed_time": "0:17:16", "remaining_time": "0:25:10"}
{"current_steps": 110, "total_steps": 258, "loss": 0.7376, "lr": 3.5497227539006614e-05, "epoch": 1.2658959537572254, "percentage": 42.64, "elapsed_time": "0:18:07", "remaining_time": "0:24:23"}
{"current_steps": 115, "total_steps": 258, "loss": 0.9192, "lr": 3.3938125195576e-05, "epoch": 1.323699421965318, "percentage": 44.57, "elapsed_time": "0:18:54", "remaining_time": "0:23:31"}
{"current_steps": 120, "total_steps": 258, "loss": 0.7502, "lr": 3.233806432759837e-05, "epoch": 1.3815028901734103, "percentage": 46.51, "elapsed_time": "0:19:44", "remaining_time": "0:22:41"}
{"current_steps": 125, "total_steps": 258, "loss": 0.7896, "lr": 3.070437713627965e-05, "epoch": 1.439306358381503, "percentage": 48.45, "elapsed_time": "0:20:33", "remaining_time": "0:21:52"}
{"current_steps": 130, "total_steps": 258, "loss": 0.7826, "lr": 2.9044549913819124e-05, "epoch": 1.4971098265895955, "percentage": 50.39, "elapsed_time": "0:21:26", "remaining_time": "0:21:07"}
{"current_steps": 135, "total_steps": 258, "loss": 0.7622, "lr": 2.7366188737839026e-05, "epoch": 1.5549132947976878, "percentage": 52.33, "elapsed_time": "0:22:19", "remaining_time": "0:20:20"}
{"current_steps": 140, "total_steps": 258, "loss": 0.6622, "lr": 2.5676984616903367e-05, "epoch": 1.6127167630057804, "percentage": 54.26, "elapsed_time": "0:23:14", "remaining_time": "0:19:35"}
{"current_steps": 145, "total_steps": 258, "loss": 0.809, "lr": 2.3984678246844677e-05, "epoch": 1.6705202312138727, "percentage": 56.2, "elapsed_time": "0:24:02", "remaining_time": "0:18:44"}
{"current_steps": 150, "total_steps": 258, "loss": 0.7095, "lr": 2.2297024539401463e-05, "epoch": 1.7283236994219653, "percentage": 58.14, "elapsed_time": "0:24:53", "remaining_time": "0:17:55"}
{"current_steps": 155, "total_steps": 258, "loss": 0.8316, "lr": 2.0621757085711734e-05, "epoch": 1.7861271676300579, "percentage": 60.08, "elapsed_time": "0:25:41", "remaining_time": "0:17:04"}
{"current_steps": 160, "total_steps": 258, "loss": 0.7683, "lr": 1.8966552717507364e-05, "epoch": 1.8439306358381504, "percentage": 62.02, "elapsed_time": "0:26:28", "remaining_time": "0:16:12"}
{"current_steps": 165, "total_steps": 258, "loss": 0.7656, "lr": 1.7338996328405526e-05, "epoch": 1.9017341040462428, "percentage": 63.95, "elapsed_time": "0:27:21", "remaining_time": "0:15:25"}
{"current_steps": 170, "total_steps": 258, "loss": 0.7079, "lr": 1.574654611650214e-05, "epoch": 1.9595375722543351, "percentage": 65.89, "elapsed_time": "0:28:10", "remaining_time": "0:14:35"}
{"current_steps": 175, "total_steps": 258, "loss": 0.7448, "lr": 1.4196499407541359e-05, "epoch": 2.0115606936416186, "percentage": 67.83, "elapsed_time": "0:28:59", "remaining_time": "0:13:45"}
{"current_steps": 180, "total_steps": 258, "loss": 0.5049, "lr": 1.2695959215274816e-05, "epoch": 2.069364161849711, "percentage": 69.77, "elapsed_time": "0:29:50", "remaining_time": "0:12:55"}
{"current_steps": 185, "total_steps": 258, "loss": 0.4581, "lr": 1.125180169224613e-05, "epoch": 2.1271676300578033, "percentage": 71.71, "elapsed_time": "0:30:42", "remaining_time": "0:12:07"}
{"current_steps": 190, "total_steps": 258, "loss": 0.4307, "lr": 9.870644620155877e-06, "epoch": 2.184971098265896, "percentage": 73.64, "elapsed_time": "0:31:31", "remaining_time": "0:11:16"}
{"current_steps": 195, "total_steps": 258, "loss": 0.4858, "lr": 8.558817084198387e-06, "epoch": 2.2427745664739884, "percentage": 75.58, "elapsed_time": "0:32:17", "remaining_time": "0:10:25"}
{"current_steps": 200, "total_steps": 258, "loss": 0.4745, "lr": 7.3223304703363135e-06, "epoch": 2.300578034682081, "percentage": 77.52, "elapsed_time": "0:33:06", "remaining_time": "0:09:36"}
{"current_steps": 205, "total_steps": 258, "loss": 0.5683, "lr": 6.166850918416406e-06, "epoch": 2.3583815028901736, "percentage": 79.46, "elapsed_time": "0:33:59", "remaining_time": "0:08:47"}
{"current_steps": 210, "total_steps": 258, "loss": 0.466, "lr": 5.097673357358907e-06, "epoch": 2.416184971098266, "percentage": 81.4, "elapsed_time": "0:34:49", "remaining_time": "0:07:57"}
{"current_steps": 215, "total_steps": 258, "loss": 0.4577, "lr": 4.119697241402998e-06, "epoch": 2.4739884393063583, "percentage": 83.33, "elapsed_time": "0:35:38", "remaining_time": "0:07:07"}
{"current_steps": 220, "total_steps": 258, "loss": 0.3862, "lr": 3.2374040985957004e-06, "epoch": 2.531791907514451, "percentage": 85.27, "elapsed_time": "0:36:24", "remaining_time": "0:06:17"}
{"current_steps": 225, "total_steps": 258, "loss": 0.4205, "lr": 2.4548369944073004e-06, "epoch": 2.5895953757225434, "percentage": 87.21, "elapsed_time": "0:37:15", "remaining_time": "0:05:27"}
{"current_steps": 230, "total_steps": 258, "loss": 0.3581, "lr": 1.7755820045802145e-06, "epoch": 2.647398843930636, "percentage": 89.15, "elapsed_time": "0:38:06", "remaining_time": "0:04:38"}
{"current_steps": 235, "total_steps": 258, "loss": 0.4342, "lr": 1.2027517821111112e-06, "epoch": 2.705202312138728, "percentage": 91.09, "elapsed_time": "0:38:56", "remaining_time": "0:03:48"}
{"current_steps": 240, "total_steps": 258, "loss": 0.4275, "lr": 7.389712936697129e-07, "epoch": 2.7630057803468207, "percentage": 93.02, "elapsed_time": "0:39:43", "remaining_time": "0:02:58"}
{"current_steps": 245, "total_steps": 258, "loss": 0.4198, "lr": 3.8636579081657577e-07, "epoch": 2.820809248554913, "percentage": 94.96, "elapsed_time": "0:40:38", "remaining_time": "0:02:09"}
{"current_steps": 250, "total_steps": 258, "loss": 0.5151, "lr": 1.4655107114101007e-07, "epoch": 2.878612716763006, "percentage": 96.9, "elapsed_time": "0:41:35", "remaining_time": "0:01:19"}
{"current_steps": 255, "total_steps": 258, "loss": 0.4155, "lr": 2.0626073947138668e-08, "epoch": 2.9364161849710984, "percentage": 98.84, "elapsed_time": "0:42:25", "remaining_time": "0:00:29"}
{"current_steps": 258, "total_steps": 258, "epoch": 2.9710982658959537, "percentage": 100.0, "elapsed_time": "0:42:58", "remaining_time": "0:00:00"}