climate-1day / trainer_log.jsonl
Howard881010's picture
Upload folder using huggingface_hub
f696f1e verified
{"current_steps": 10, "total_steps": 375, "loss": 1.8708, "lr": 9.982464296247522e-05, "epoch": 0.02666666666666667, "percentage": 2.67, "elapsed_time": "0:00:31", "remaining_time": "0:19:05"}
{"current_steps": 10, "total_steps": 375, "eval_loss": 1.7566570043563843, "epoch": 0.02666666666666667, "percentage": 2.67, "elapsed_time": "0:01:12", "remaining_time": "0:43:48"}
{"current_steps": 20, "total_steps": 375, "loss": 1.7168, "lr": 9.929980185352526e-05, "epoch": 0.05333333333333334, "percentage": 5.33, "elapsed_time": "0:01:43", "remaining_time": "0:30:39"}
{"current_steps": 20, "total_steps": 375, "eval_loss": 1.6883971691131592, "epoch": 0.05333333333333334, "percentage": 5.33, "elapsed_time": "0:02:24", "remaining_time": "0:42:45"}
{"current_steps": 30, "total_steps": 375, "loss": 1.6815, "lr": 9.842915805643155e-05, "epoch": 0.08, "percentage": 8.0, "elapsed_time": "0:02:56", "remaining_time": "0:33:45"}
{"current_steps": 30, "total_steps": 375, "eval_loss": 1.649947166442871, "epoch": 0.08, "percentage": 8.0, "elapsed_time": "0:03:37", "remaining_time": "0:41:36"}
{"current_steps": 40, "total_steps": 375, "loss": 1.6333, "lr": 9.721881851187406e-05, "epoch": 0.10666666666666667, "percentage": 10.67, "elapsed_time": "0:04:07", "remaining_time": "0:34:32"}
{"current_steps": 40, "total_steps": 375, "eval_loss": 1.6236332654953003, "epoch": 0.10666666666666667, "percentage": 10.67, "elapsed_time": "0:04:48", "remaining_time": "0:40:14"}
{"current_steps": 50, "total_steps": 375, "loss": 1.6028, "lr": 9.567727288213005e-05, "epoch": 0.13333333333333333, "percentage": 13.33, "elapsed_time": "0:05:20", "remaining_time": "0:34:40"}
{"current_steps": 50, "total_steps": 375, "eval_loss": 1.6038854122161865, "epoch": 0.13333333333333333, "percentage": 13.33, "elapsed_time": "0:06:01", "remaining_time": "0:39:06"}
{"current_steps": 60, "total_steps": 375, "loss": 1.5665, "lr": 9.381533400219318e-05, "epoch": 0.16, "percentage": 16.0, "elapsed_time": "0:06:32", "remaining_time": "0:34:19"}
{"current_steps": 60, "total_steps": 375, "eval_loss": 1.5894596576690674, "epoch": 0.16, "percentage": 16.0, "elapsed_time": "0:07:13", "remaining_time": "0:37:54"}
{"current_steps": 70, "total_steps": 375, "loss": 1.574, "lr": 9.164606203550497e-05, "epoch": 0.18666666666666668, "percentage": 18.67, "elapsed_time": "0:07:45", "remaining_time": "0:33:47"}
{"current_steps": 70, "total_steps": 375, "eval_loss": 1.5772351026535034, "epoch": 0.18666666666666668, "percentage": 18.67, "elapsed_time": "0:08:26", "remaining_time": "0:36:45"}
{"current_steps": 80, "total_steps": 375, "loss": 1.5862, "lr": 8.9184672866292e-05, "epoch": 0.21333333333333335, "percentage": 21.33, "elapsed_time": "0:08:55", "remaining_time": "0:32:56"}
{"current_steps": 80, "total_steps": 375, "eval_loss": 1.5647927522659302, "epoch": 0.21333333333333335, "percentage": 21.33, "elapsed_time": "0:09:36", "remaining_time": "0:35:26"}
{"current_steps": 90, "total_steps": 375, "loss": 1.5218, "lr": 8.644843137107059e-05, "epoch": 0.24, "percentage": 24.0, "elapsed_time": "0:10:07", "remaining_time": "0:32:04"}
{"current_steps": 90, "total_steps": 375, "eval_loss": 1.556412696838379, "epoch": 0.24, "percentage": 24.0, "elapsed_time": "0:10:48", "remaining_time": "0:34:13"}
{"current_steps": 100, "total_steps": 375, "loss": 1.5451, "lr": 8.345653031794292e-05, "epoch": 0.26666666666666666, "percentage": 26.67, "elapsed_time": "0:11:18", "remaining_time": "0:31:04"}
{"current_steps": 100, "total_steps": 375, "eval_loss": 1.5465766191482544, "epoch": 0.26666666666666666, "percentage": 26.67, "elapsed_time": "0:11:59", "remaining_time": "0:32:57"}
{"current_steps": 110, "total_steps": 375, "loss": 1.5011, "lr": 8.022995574311876e-05, "epoch": 0.29333333333333333, "percentage": 29.33, "elapsed_time": "0:12:31", "remaining_time": "0:30:11"}
{"current_steps": 110, "total_steps": 375, "eval_loss": 1.5382152795791626, "epoch": 0.29333333333333333, "percentage": 29.33, "elapsed_time": "0:13:12", "remaining_time": "0:31:49"}
{"current_steps": 120, "total_steps": 375, "loss": 1.5182, "lr": 7.679133974894983e-05, "epoch": 0.32, "percentage": 32.0, "elapsed_time": "0:13:44", "remaining_time": "0:29:12"}
{"current_steps": 120, "total_steps": 375, "eval_loss": 1.5328434705734253, "epoch": 0.32, "percentage": 32.0, "elapsed_time": "0:14:25", "remaining_time": "0:30:39"}
{"current_steps": 130, "total_steps": 375, "loss": 1.5331, "lr": 7.316480175599309e-05, "epoch": 0.3466666666666667, "percentage": 34.67, "elapsed_time": "0:14:55", "remaining_time": "0:28:07"}
{"current_steps": 130, "total_steps": 375, "eval_loss": 1.524049997329712, "epoch": 0.3466666666666667, "percentage": 34.67, "elapsed_time": "0:15:36", "remaining_time": "0:29:24"}
{"current_steps": 140, "total_steps": 375, "loss": 1.5096, "lr": 6.937577932260515e-05, "epoch": 0.37333333333333335, "percentage": 37.33, "elapsed_time": "0:16:07", "remaining_time": "0:27:04"}
{"current_steps": 140, "total_steps": 375, "eval_loss": 1.5180366039276123, "epoch": 0.37333333333333335, "percentage": 37.33, "elapsed_time": "0:16:48", "remaining_time": "0:28:13"}
{"current_steps": 150, "total_steps": 375, "loss": 1.5433, "lr": 6.545084971874738e-05, "epoch": 0.4, "percentage": 40.0, "elapsed_time": "0:17:20", "remaining_time": "0:26:00"}
{"current_steps": 150, "total_steps": 375, "eval_loss": 1.5124986171722412, "epoch": 0.4, "percentage": 40.0, "elapsed_time": "0:18:01", "remaining_time": "0:27:01"}
{"current_steps": 160, "total_steps": 375, "loss": 1.4919, "lr": 6.141754350553279e-05, "epoch": 0.4266666666666667, "percentage": 42.67, "elapsed_time": "0:18:32", "remaining_time": "0:24:54"}
{"current_steps": 160, "total_steps": 375, "eval_loss": 1.5082223415374756, "epoch": 0.4266666666666667, "percentage": 42.67, "elapsed_time": "0:19:13", "remaining_time": "0:25:49"}
{"current_steps": 170, "total_steps": 375, "loss": 1.5119, "lr": 5.730415142812059e-05, "epoch": 0.4533333333333333, "percentage": 45.33, "elapsed_time": "0:19:45", "remaining_time": "0:23:49"}
{"current_steps": 170, "total_steps": 375, "eval_loss": 1.5036897659301758, "epoch": 0.4533333333333333, "percentage": 45.33, "elapsed_time": "0:20:26", "remaining_time": "0:24:38"}
{"current_steps": 180, "total_steps": 375, "loss": 1.4898, "lr": 5.313952597646568e-05, "epoch": 0.48, "percentage": 48.0, "elapsed_time": "0:20:57", "remaining_time": "0:22:42"}
{"current_steps": 180, "total_steps": 375, "eval_loss": 1.4962352514266968, "epoch": 0.48, "percentage": 48.0, "elapsed_time": "0:21:38", "remaining_time": "0:23:26"}
{"current_steps": 190, "total_steps": 375, "loss": 1.4879, "lr": 4.895287900583216e-05, "epoch": 0.5066666666666667, "percentage": 50.67, "elapsed_time": "0:22:09", "remaining_time": "0:21:34"}
{"current_steps": 190, "total_steps": 375, "eval_loss": 1.4909743070602417, "epoch": 0.5066666666666667, "percentage": 50.67, "elapsed_time": "0:22:50", "remaining_time": "0:22:14"}
{"current_steps": 200, "total_steps": 375, "loss": 1.4813, "lr": 4.477357683661734e-05, "epoch": 0.5333333333333333, "percentage": 53.33, "elapsed_time": "0:23:20", "remaining_time": "0:20:25"}
{"current_steps": 200, "total_steps": 375, "eval_loss": 1.48694908618927, "epoch": 0.5333333333333333, "percentage": 53.33, "elapsed_time": "0:24:01", "remaining_time": "0:21:01"}
{"current_steps": 210, "total_steps": 375, "loss": 1.4776, "lr": 4.063093427071376e-05, "epoch": 0.56, "percentage": 56.0, "elapsed_time": "0:24:33", "remaining_time": "0:19:17"}
{"current_steps": 210, "total_steps": 375, "eval_loss": 1.482069730758667, "epoch": 0.56, "percentage": 56.0, "elapsed_time": "0:25:14", "remaining_time": "0:19:49"}
{"current_steps": 220, "total_steps": 375, "loss": 1.4786, "lr": 3.655400896923672e-05, "epoch": 0.5866666666666667, "percentage": 58.67, "elapsed_time": "0:25:44", "remaining_time": "0:18:08"}
{"current_steps": 220, "total_steps": 375, "eval_loss": 1.4782707691192627, "epoch": 0.5866666666666667, "percentage": 58.67, "elapsed_time": "0:26:25", "remaining_time": "0:18:37"}
{"current_steps": 230, "total_steps": 375, "loss": 1.4825, "lr": 3.257139763390925e-05, "epoch": 0.6133333333333333, "percentage": 61.33, "elapsed_time": "0:26:56", "remaining_time": "0:16:59"}
{"current_steps": 230, "total_steps": 375, "eval_loss": 1.4740064144134521, "epoch": 0.6133333333333333, "percentage": 61.33, "elapsed_time": "0:27:37", "remaining_time": "0:17:25"}
{"current_steps": 240, "total_steps": 375, "loss": 1.4525, "lr": 2.8711035421746367e-05, "epoch": 0.64, "percentage": 64.0, "elapsed_time": "0:28:08", "remaining_time": "0:15:49"}
{"current_steps": 240, "total_steps": 375, "eval_loss": 1.47102689743042, "epoch": 0.64, "percentage": 64.0, "elapsed_time": "0:28:49", "remaining_time": "0:16:12"}
{"current_steps": 250, "total_steps": 375, "loss": 1.4794, "lr": 2.500000000000001e-05, "epoch": 0.6666666666666666, "percentage": 66.67, "elapsed_time": "0:29:21", "remaining_time": "0:14:40"}
{"current_steps": 250, "total_steps": 375, "eval_loss": 1.4680323600769043, "epoch": 0.6666666666666666, "percentage": 66.67, "elapsed_time": "0:30:01", "remaining_time": "0:15:00"}
{"current_steps": 260, "total_steps": 375, "loss": 1.4785, "lr": 2.1464321615778422e-05, "epoch": 0.6933333333333334, "percentage": 69.33, "elapsed_time": "0:30:32", "remaining_time": "0:13:30"}
{"current_steps": 260, "total_steps": 375, "eval_loss": 1.46550714969635, "epoch": 0.6933333333333334, "percentage": 69.33, "elapsed_time": "0:31:13", "remaining_time": "0:13:48"}
{"current_steps": 270, "total_steps": 375, "loss": 1.4523, "lr": 1.8128800512565513e-05, "epoch": 0.72, "percentage": 72.0, "elapsed_time": "0:31:44", "remaining_time": "0:12:20"}
{"current_steps": 270, "total_steps": 375, "eval_loss": 1.462823748588562, "epoch": 0.72, "percentage": 72.0, "elapsed_time": "0:32:24", "remaining_time": "0:12:36"}
{"current_steps": 280, "total_steps": 375, "loss": 1.4618, "lr": 1.5016832974331724e-05, "epoch": 0.7466666666666667, "percentage": 74.67, "elapsed_time": "0:32:56", "remaining_time": "0:11:10"}
{"current_steps": 280, "total_steps": 375, "eval_loss": 1.4604686498641968, "epoch": 0.7466666666666667, "percentage": 74.67, "elapsed_time": "0:33:37", "remaining_time": "0:11:24"}
{"current_steps": 290, "total_steps": 375, "loss": 1.4751, "lr": 1.2150247217412186e-05, "epoch": 0.7733333333333333, "percentage": 77.33, "elapsed_time": "0:34:10", "remaining_time": "0:10:01"}
{"current_steps": 290, "total_steps": 375, "eval_loss": 1.4580776691436768, "epoch": 0.7733333333333333, "percentage": 77.33, "elapsed_time": "0:34:51", "remaining_time": "0:10:13"}
{"current_steps": 300, "total_steps": 375, "loss": 1.4263, "lr": 9.549150281252633e-06, "epoch": 0.8, "percentage": 80.0, "elapsed_time": "0:35:22", "remaining_time": "0:08:50"}
{"current_steps": 300, "total_steps": 375, "eval_loss": 1.4561147689819336, "epoch": 0.8, "percentage": 80.0, "elapsed_time": "0:36:03", "remaining_time": "0:09:00"}
{"current_steps": 310, "total_steps": 375, "loss": 1.4421, "lr": 7.2317869919746705e-06, "epoch": 0.8266666666666667, "percentage": 82.67, "elapsed_time": "0:36:34", "remaining_time": "0:07:40"}
{"current_steps": 310, "total_steps": 375, "eval_loss": 1.4547889232635498, "epoch": 0.8266666666666667, "percentage": 82.67, "elapsed_time": "0:37:15", "remaining_time": "0:07:48"}
{"current_steps": 320, "total_steps": 375, "loss": 1.4824, "lr": 5.214411988029355e-06, "epoch": 0.8533333333333334, "percentage": 85.33, "elapsed_time": "0:37:45", "remaining_time": "0:06:29"}
{"current_steps": 320, "total_steps": 375, "eval_loss": 1.4539330005645752, "epoch": 0.8533333333333334, "percentage": 85.33, "elapsed_time": "0:38:26", "remaining_time": "0:06:36"}
{"current_steps": 330, "total_steps": 375, "loss": 1.4675, "lr": 3.511175705587433e-06, "epoch": 0.88, "percentage": 88.0, "elapsed_time": "0:38:57", "remaining_time": "0:05:18"}
{"current_steps": 330, "total_steps": 375, "eval_loss": 1.4530839920043945, "epoch": 0.88, "percentage": 88.0, "elapsed_time": "0:39:38", "remaining_time": "0:05:24"}
{"current_steps": 340, "total_steps": 375, "loss": 1.4891, "lr": 2.134025123396638e-06, "epoch": 0.9066666666666666, "percentage": 90.67, "elapsed_time": "0:40:09", "remaining_time": "0:04:08"}
{"current_steps": 340, "total_steps": 375, "eval_loss": 1.452470302581787, "epoch": 0.9066666666666666, "percentage": 90.67, "elapsed_time": "0:40:50", "remaining_time": "0:04:12"}
{"current_steps": 350, "total_steps": 375, "loss": 1.4617, "lr": 1.0926199633097157e-06, "epoch": 0.9333333333333333, "percentage": 93.33, "elapsed_time": "0:41:23", "remaining_time": "0:02:57"}
{"current_steps": 350, "total_steps": 375, "eval_loss": 1.4520126581192017, "epoch": 0.9333333333333333, "percentage": 93.33, "elapsed_time": "0:42:03", "remaining_time": "0:03:00"}
{"current_steps": 360, "total_steps": 375, "loss": 1.4404, "lr": 3.9426493427611177e-07, "epoch": 0.96, "percentage": 96.0, "elapsed_time": "0:42:35", "remaining_time": "0:01:46"}
{"current_steps": 360, "total_steps": 375, "eval_loss": 1.4521235227584839, "epoch": 0.96, "percentage": 96.0, "elapsed_time": "0:43:16", "remaining_time": "0:01:48"}
{"current_steps": 370, "total_steps": 375, "loss": 1.44, "lr": 4.385849505708084e-08, "epoch": 0.9866666666666667, "percentage": 98.67, "elapsed_time": "0:43:47", "remaining_time": "0:00:35"}
{"current_steps": 370, "total_steps": 375, "eval_loss": 1.4519704580307007, "epoch": 0.9866666666666667, "percentage": 98.67, "elapsed_time": "0:44:28", "remaining_time": "0:00:36"}
{"current_steps": 375, "total_steps": 375, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "0:44:44", "remaining_time": "0:00:00"}