taskmaster2-3k-traces / trainer_log.jsonl
penfever's picture
Model save
75adc52 verified
{"current_steps": 5, "total_steps": 250, "loss": 0.768, "lr": 6.4000000000000006e-06, "epoch": 0.10101010101010101, "percentage": 2.0, "elapsed_time": "0:02:01", "remaining_time": "1:39:19"}
{"current_steps": 10, "total_steps": 250, "loss": 0.6809, "lr": 1.4400000000000001e-05, "epoch": 0.20202020202020202, "percentage": 4.0, "elapsed_time": "0:03:49", "remaining_time": "1:31:36"}
{"current_steps": 15, "total_steps": 250, "loss": 0.6367, "lr": 2.2400000000000002e-05, "epoch": 0.30303030303030304, "percentage": 6.0, "elapsed_time": "0:05:30", "remaining_time": "1:26:22"}
{"current_steps": 20, "total_steps": 250, "loss": 0.603, "lr": 3.0400000000000004e-05, "epoch": 0.40404040404040403, "percentage": 8.0, "elapsed_time": "0:07:21", "remaining_time": "1:24:38"}
{"current_steps": 25, "total_steps": 250, "loss": 0.5739, "lr": 3.8400000000000005e-05, "epoch": 0.5050505050505051, "percentage": 10.0, "elapsed_time": "0:09:13", "remaining_time": "1:23:05"}
{"current_steps": 30, "total_steps": 250, "loss": 0.531, "lr": 3.9968815283639625e-05, "epoch": 0.6060606060606061, "percentage": 12.0, "elapsed_time": "0:11:07", "remaining_time": "1:21:35"}
{"current_steps": 35, "total_steps": 250, "loss": 0.5137, "lr": 3.9842294026289565e-05, "epoch": 0.7070707070707071, "percentage": 14.0, "elapsed_time": "0:12:59", "remaining_time": "1:19:48"}
{"current_steps": 40, "total_steps": 250, "loss": 0.5033, "lr": 3.9619103106983835e-05, "epoch": 0.8080808080808081, "percentage": 16.0, "elapsed_time": "0:14:50", "remaining_time": "1:17:53"}
{"current_steps": 45, "total_steps": 250, "loss": 0.4921, "lr": 3.930032988944623e-05, "epoch": 0.9090909090909091, "percentage": 18.0, "elapsed_time": "0:16:37", "remaining_time": "1:15:44"}
{"current_steps": 50, "total_steps": 250, "loss": 0.4725, "lr": 3.888752740474962e-05, "epoch": 1.0, "percentage": 20.0, "elapsed_time": "0:18:16", "remaining_time": "1:13:05"}
{"current_steps": 55, "total_steps": 250, "loss": 0.4631, "lr": 3.838270678510469e-05, "epoch": 1.101010101010101, "percentage": 22.0, "elapsed_time": "0:20:10", "remaining_time": "1:11:30"}
{"current_steps": 60, "total_steps": 250, "loss": 0.4695, "lr": 3.778832746582596e-05, "epoch": 1.202020202020202, "percentage": 24.0, "elapsed_time": "0:21:54", "remaining_time": "1:09:23"}
{"current_steps": 65, "total_steps": 250, "loss": 0.4622, "lr": 3.710728520321014e-05, "epoch": 1.303030303030303, "percentage": 26.0, "elapsed_time": "0:23:44", "remaining_time": "1:07:34"}
{"current_steps": 70, "total_steps": 250, "loss": 0.4639, "lr": 3.634289796670257e-05, "epoch": 1.404040404040404, "percentage": 28.0, "elapsed_time": "0:25:33", "remaining_time": "1:05:43"}
{"current_steps": 75, "total_steps": 250, "loss": 0.4547, "lr": 3.549888977408359e-05, "epoch": 1.5050505050505052, "percentage": 30.0, "elapsed_time": "0:27:21", "remaining_time": "1:03:50"}
{"current_steps": 80, "total_steps": 250, "loss": 0.4478, "lr": 3.457937254842823e-05, "epoch": 1.606060606060606, "percentage": 32.0, "elapsed_time": "0:29:06", "remaining_time": "1:01:51"}
{"current_steps": 85, "total_steps": 250, "loss": 0.4405, "lr": 3.3588826085230336e-05, "epoch": 1.7070707070707072, "percentage": 34.0, "elapsed_time": "0:30:55", "remaining_time": "1:00:02"}
{"current_steps": 90, "total_steps": 250, "loss": 0.441, "lr": 3.253207622728921e-05, "epoch": 1.808080808080808, "percentage": 36.0, "elapsed_time": "0:32:45", "remaining_time": "0:58:13"}
{"current_steps": 95, "total_steps": 250, "loss": 0.4447, "lr": 3.141427135368864e-05, "epoch": 1.9090909090909092, "percentage": 38.0, "elapsed_time": "0:34:32", "remaining_time": "0:56:21"}
{"current_steps": 100, "total_steps": 250, "loss": 0.4481, "lr": 3.024085729741143e-05, "epoch": 2.0, "percentage": 40.0, "elapsed_time": "0:36:09", "remaining_time": "0:54:14"}
{"current_steps": 105, "total_steps": 250, "loss": 0.4286, "lr": 2.9017550813788616e-05, "epoch": 2.101010101010101, "percentage": 42.0, "elapsed_time": "0:37:56", "remaining_time": "0:52:23"}
{"current_steps": 110, "total_steps": 250, "loss": 0.4249, "lr": 2.7750311729042062e-05, "epoch": 2.202020202020202, "percentage": 44.0, "elapsed_time": "0:39:51", "remaining_time": "0:50:43"}
{"current_steps": 115, "total_steps": 250, "loss": 0.4319, "lr": 2.6445313904610227e-05, "epoch": 2.303030303030303, "percentage": 46.0, "elapsed_time": "0:41:40", "remaining_time": "0:48:55"}
{"current_steps": 120, "total_steps": 250, "loss": 0.4335, "lr": 2.510891515871581e-05, "epoch": 2.404040404040404, "percentage": 48.0, "elapsed_time": "0:43:26", "remaining_time": "0:47:03"}
{"current_steps": 125, "total_steps": 250, "loss": 0.4247, "lr": 2.37476262917145e-05, "epoch": 2.505050505050505, "percentage": 50.0, "elapsed_time": "0:45:16", "remaining_time": "0:45:16"}
{"current_steps": 130, "total_steps": 250, "loss": 0.4187, "lr": 2.2368079366130028e-05, "epoch": 2.606060606060606, "percentage": 52.0, "elapsed_time": "0:47:03", "remaining_time": "0:43:26"}
{"current_steps": 135, "total_steps": 250, "loss": 0.4274, "lr": 2.097699539591227e-05, "epoch": 2.707070707070707, "percentage": 54.0, "elapsed_time": "0:48:45", "remaining_time": "0:41:32"}
{"current_steps": 140, "total_steps": 250, "loss": 0.4177, "lr": 1.9581151602332865e-05, "epoch": 2.808080808080808, "percentage": 56.0, "elapsed_time": "0:50:29", "remaining_time": "0:39:40"}
{"current_steps": 145, "total_steps": 250, "loss": 0.4231, "lr": 1.8187348396044402e-05, "epoch": 2.909090909090909, "percentage": 58.0, "elapsed_time": "0:52:15", "remaining_time": "0:37:50"}
{"current_steps": 150, "total_steps": 250, "loss": 0.4307, "lr": 1.6802376246163307e-05, "epoch": 3.0, "percentage": 60.0, "elapsed_time": "0:54:01", "remaining_time": "0:36:01"}
{"current_steps": 155, "total_steps": 250, "loss": 0.4228, "lr": 1.5432982597786886e-05, "epoch": 3.101010101010101, "percentage": 62.0, "elapsed_time": "0:55:51", "remaining_time": "0:34:13"}
{"current_steps": 160, "total_steps": 250, "loss": 0.4183, "lr": 1.4085838999119075e-05, "epoch": 3.202020202020202, "percentage": 64.0, "elapsed_time": "0:57:36", "remaining_time": "0:32:24"}
{"current_steps": 165, "total_steps": 250, "loss": 0.4119, "lr": 1.2767508598358158e-05, "epoch": 3.303030303030303, "percentage": 66.0, "elapsed_time": "0:59:34", "remaining_time": "0:30:41"}
{"current_steps": 170, "total_steps": 250, "loss": 0.4109, "lr": 1.1484414168698547e-05, "epoch": 3.404040404040404, "percentage": 68.0, "elapsed_time": "1:01:22", "remaining_time": "0:28:52"}
{"current_steps": 175, "total_steps": 250, "loss": 0.4183, "lr": 1.0242806817225344e-05, "epoch": 3.505050505050505, "percentage": 70.0, "elapsed_time": "1:03:13", "remaining_time": "0:27:05"}
{"current_steps": 180, "total_steps": 250, "loss": 0.4057, "lr": 9.048735530148998e-06, "epoch": 3.606060606060606, "percentage": 72.0, "elapsed_time": "1:05:00", "remaining_time": "0:25:16"}
{"current_steps": 185, "total_steps": 250, "loss": 0.4167, "lr": 7.908017702752504e-06, "epoch": 3.707070707070707, "percentage": 74.0, "elapsed_time": "1:06:41", "remaining_time": "0:23:26"}
{"current_steps": 190, "total_steps": 250, "loss": 0.4158, "lr": 6.826210797626389e-06, "epoch": 3.808080808080808, "percentage": 76.0, "elapsed_time": "1:08:30", "remaining_time": "0:21:37"}
{"current_steps": 195, "total_steps": 250, "loss": 0.4088, "lr": 5.8085852692695864e-06, "epoch": 3.909090909090909, "percentage": 78.0, "elapsed_time": "1:10:15", "remaining_time": "0:19:49"}
{"current_steps": 200, "total_steps": 250, "loss": 0.4077, "lr": 4.8600988869648745e-06, "epoch": 4.0, "percentage": 80.0, "elapsed_time": "1:11:54", "remaining_time": "0:17:58"}
{"current_steps": 205, "total_steps": 250, "loss": 0.3992, "lr": 3.985372581025333e-06, "epoch": 4.101010101010101, "percentage": 82.0, "elapsed_time": "1:13:40", "remaining_time": "0:16:10"}
{"current_steps": 210, "total_steps": 250, "loss": 0.407, "lr": 3.1886679300863156e-06, "epoch": 4.202020202020202, "percentage": 84.0, "elapsed_time": "1:15:30", "remaining_time": "0:14:22"}
{"current_steps": 215, "total_steps": 250, "loss": 0.4133, "lr": 2.473866399122733e-06, "epoch": 4.303030303030303, "percentage": 86.0, "elapsed_time": "1:17:19", "remaining_time": "0:12:35"}
{"current_steps": 220, "total_steps": 250, "loss": 0.4124, "lr": 1.8444504293418286e-06, "epoch": 4.404040404040404, "percentage": 88.0, "elapsed_time": "1:19:10", "remaining_time": "0:10:47"}
{"current_steps": 225, "total_steps": 250, "loss": 0.4125, "lr": 1.3034864720797112e-06, "epoch": 4.505050505050505, "percentage": 90.0, "elapsed_time": "1:20:56", "remaining_time": "0:08:59"}
{"current_steps": 230, "total_steps": 250, "loss": 0.4023, "lr": 8.536100493586552e-07, "epoch": 4.606060606060606, "percentage": 92.0, "elapsed_time": "1:22:40", "remaining_time": "0:07:11"}
{"current_steps": 235, "total_steps": 250, "loss": 0.4078, "lr": 4.970129138887347e-07, "epoch": 4.707070707070707, "percentage": 94.0, "elapsed_time": "1:24:32", "remaining_time": "0:05:23"}
{"current_steps": 240, "total_steps": 250, "loss": 0.4138, "lr": 2.3543237106894434e-07, "epoch": 4.808080808080808, "percentage": 96.0, "elapsed_time": "1:26:19", "remaining_time": "0:03:35"}
{"current_steps": 245, "total_steps": 250, "loss": 0.4099, "lr": 7.01428150099126e-08, "epoch": 4.909090909090909, "percentage": 98.0, "elapsed_time": "1:28:05", "remaining_time": "0:01:47"}
{"current_steps": 250, "total_steps": 250, "loss": 0.4103, "lr": 1.949519813915224e-09, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "1:29:41", "remaining_time": "0:00:00"}
{"current_steps": 250, "total_steps": 250, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "1:29:41", "remaining_time": "0:00:00"}