OH_original_wo_platypus / trainer_log.jsonl
sedrickkeh's picture
Training in progress, epoch 0
9eff072 verified
{"current_steps": 10, "total_steps": 984, "loss": 0.801, "learning_rate": 5e-06, "epoch": 0.030441400304414, "percentage": 1.02, "elapsed_time": "0:04:55", "remaining_time": "8:00:01"}
{"current_steps": 20, "total_steps": 984, "loss": 0.7282, "learning_rate": 5e-06, "epoch": 0.060882800608828, "percentage": 2.03, "elapsed_time": "0:09:48", "remaining_time": "7:52:31"}
{"current_steps": 30, "total_steps": 984, "loss": 0.7045, "learning_rate": 5e-06, "epoch": 0.091324200913242, "percentage": 3.05, "elapsed_time": "0:14:39", "remaining_time": "7:46:15"}
{"current_steps": 40, "total_steps": 984, "loss": 0.6875, "learning_rate": 5e-06, "epoch": 0.121765601217656, "percentage": 4.07, "elapsed_time": "0:19:31", "remaining_time": "7:40:55"}
{"current_steps": 50, "total_steps": 984, "loss": 0.6818, "learning_rate": 5e-06, "epoch": 0.15220700152207, "percentage": 5.08, "elapsed_time": "0:24:24", "remaining_time": "7:35:53"}
{"current_steps": 60, "total_steps": 984, "loss": 0.6695, "learning_rate": 5e-06, "epoch": 0.182648401826484, "percentage": 6.1, "elapsed_time": "0:29:16", "remaining_time": "7:30:55"}
{"current_steps": 70, "total_steps": 984, "loss": 0.6519, "learning_rate": 5e-06, "epoch": 0.213089802130898, "percentage": 7.11, "elapsed_time": "0:34:09", "remaining_time": "7:26:01"}
{"current_steps": 80, "total_steps": 984, "loss": 0.6423, "learning_rate": 5e-06, "epoch": 0.243531202435312, "percentage": 8.13, "elapsed_time": "0:39:02", "remaining_time": "7:21:07"}
{"current_steps": 90, "total_steps": 984, "loss": 0.6501, "learning_rate": 5e-06, "epoch": 0.273972602739726, "percentage": 9.15, "elapsed_time": "0:43:54", "remaining_time": "7:16:14"}
{"current_steps": 100, "total_steps": 984, "loss": 0.6403, "learning_rate": 5e-06, "epoch": 0.30441400304414, "percentage": 10.16, "elapsed_time": "0:48:47", "remaining_time": "7:11:19"}
{"current_steps": 110, "total_steps": 984, "loss": 0.6327, "learning_rate": 5e-06, "epoch": 0.334855403348554, "percentage": 11.18, "elapsed_time": "0:53:39", "remaining_time": "7:06:23"}
{"current_steps": 120, "total_steps": 984, "loss": 0.6311, "learning_rate": 5e-06, "epoch": 0.365296803652968, "percentage": 12.2, "elapsed_time": "0:58:32", "remaining_time": "7:01:31"}
{"current_steps": 130, "total_steps": 984, "loss": 0.6383, "learning_rate": 5e-06, "epoch": 0.395738203957382, "percentage": 13.21, "elapsed_time": "1:03:25", "remaining_time": "6:56:38"}
{"current_steps": 140, "total_steps": 984, "loss": 0.6289, "learning_rate": 5e-06, "epoch": 0.426179604261796, "percentage": 14.23, "elapsed_time": "1:08:18", "remaining_time": "6:51:45"}
{"current_steps": 150, "total_steps": 984, "loss": 0.6315, "learning_rate": 5e-06, "epoch": 0.45662100456621, "percentage": 15.24, "elapsed_time": "1:13:10", "remaining_time": "6:46:52"}
{"current_steps": 160, "total_steps": 984, "loss": 0.6292, "learning_rate": 5e-06, "epoch": 0.487062404870624, "percentage": 16.26, "elapsed_time": "1:18:03", "remaining_time": "6:41:59"}
{"current_steps": 170, "total_steps": 984, "loss": 0.6274, "learning_rate": 5e-06, "epoch": 0.517503805175038, "percentage": 17.28, "elapsed_time": "1:22:56", "remaining_time": "6:37:06"}
{"current_steps": 180, "total_steps": 984, "loss": 0.6147, "learning_rate": 5e-06, "epoch": 0.547945205479452, "percentage": 18.29, "elapsed_time": "1:27:48", "remaining_time": "6:32:14"}
{"current_steps": 190, "total_steps": 984, "loss": 0.6214, "learning_rate": 5e-06, "epoch": 0.578386605783866, "percentage": 19.31, "elapsed_time": "1:32:41", "remaining_time": "6:27:22"}
{"current_steps": 200, "total_steps": 984, "loss": 0.6211, "learning_rate": 5e-06, "epoch": 0.60882800608828, "percentage": 20.33, "elapsed_time": "1:37:33", "remaining_time": "6:22:26"}
{"current_steps": 210, "total_steps": 984, "loss": 0.6269, "learning_rate": 5e-06, "epoch": 0.639269406392694, "percentage": 21.34, "elapsed_time": "1:42:26", "remaining_time": "6:17:34"}
{"current_steps": 220, "total_steps": 984, "loss": 0.6186, "learning_rate": 5e-06, "epoch": 0.669710806697108, "percentage": 22.36, "elapsed_time": "1:47:19", "remaining_time": "6:12:41"}
{"current_steps": 230, "total_steps": 984, "loss": 0.6174, "learning_rate": 5e-06, "epoch": 0.700152207001522, "percentage": 23.37, "elapsed_time": "1:52:11", "remaining_time": "6:07:48"}
{"current_steps": 240, "total_steps": 984, "loss": 0.6157, "learning_rate": 5e-06, "epoch": 0.730593607305936, "percentage": 24.39, "elapsed_time": "1:57:03", "remaining_time": "6:02:53"}
{"current_steps": 250, "total_steps": 984, "loss": 0.6119, "learning_rate": 5e-06, "epoch": 0.76103500761035, "percentage": 25.41, "elapsed_time": "2:01:55", "remaining_time": "5:57:58"}
{"current_steps": 260, "total_steps": 984, "loss": 0.6174, "learning_rate": 5e-06, "epoch": 0.791476407914764, "percentage": 26.42, "elapsed_time": "2:06:47", "remaining_time": "5:53:04"}
{"current_steps": 270, "total_steps": 984, "loss": 0.6115, "learning_rate": 5e-06, "epoch": 0.821917808219178, "percentage": 27.44, "elapsed_time": "2:11:39", "remaining_time": "5:48:10"}
{"current_steps": 280, "total_steps": 984, "loss": 0.618, "learning_rate": 5e-06, "epoch": 0.852359208523592, "percentage": 28.46, "elapsed_time": "2:16:32", "remaining_time": "5:43:18"}
{"current_steps": 290, "total_steps": 984, "loss": 0.6141, "learning_rate": 5e-06, "epoch": 0.882800608828006, "percentage": 29.47, "elapsed_time": "2:21:25", "remaining_time": "5:38:26"}
{"current_steps": 300, "total_steps": 984, "loss": 0.61, "learning_rate": 5e-06, "epoch": 0.91324200913242, "percentage": 30.49, "elapsed_time": "2:26:18", "remaining_time": "5:33:34"}
{"current_steps": 310, "total_steps": 984, "loss": 0.6086, "learning_rate": 5e-06, "epoch": 0.943683409436834, "percentage": 31.5, "elapsed_time": "2:31:10", "remaining_time": "5:28:41"}
{"current_steps": 320, "total_steps": 984, "loss": 0.6134, "learning_rate": 5e-06, "epoch": 0.974124809741248, "percentage": 32.52, "elapsed_time": "2:36:03", "remaining_time": "5:23:48"}
{"current_steps": 328, "total_steps": 984, "eval_loss": 0.6086177825927734, "epoch": 0.9984779299847792, "percentage": 33.33, "elapsed_time": "2:43:08", "remaining_time": "5:26:17"}
{"current_steps": 330, "total_steps": 984, "loss": 0.6066, "learning_rate": 5e-06, "epoch": 1.004566210045662, "percentage": 33.54, "elapsed_time": "2:44:49", "remaining_time": "5:26:39"}