oh_v1-2_only_camel_math / trainer_log.jsonl
esfrankel17's picture
Training in progress, epoch 2
e19c4a7 verified
{"current_steps": 10, "total_steps": 183, "loss": 0.5239, "learning_rate": 5e-06, "epoch": 0.16161616161616163, "percentage": 5.46, "elapsed_time": "0:05:24", "remaining_time": "1:33:29"}
{"current_steps": 20, "total_steps": 183, "loss": 0.4554, "learning_rate": 5e-06, "epoch": 0.32323232323232326, "percentage": 10.93, "elapsed_time": "0:10:40", "remaining_time": "1:26:58"}
{"current_steps": 30, "total_steps": 183, "loss": 0.4328, "learning_rate": 5e-06, "epoch": 0.48484848484848486, "percentage": 16.39, "elapsed_time": "0:15:56", "remaining_time": "1:21:17"}
{"current_steps": 40, "total_steps": 183, "loss": 0.4187, "learning_rate": 5e-06, "epoch": 0.6464646464646465, "percentage": 21.86, "elapsed_time": "0:21:11", "remaining_time": "1:15:45"}
{"current_steps": 50, "total_steps": 183, "loss": 0.4144, "learning_rate": 5e-06, "epoch": 0.8080808080808081, "percentage": 27.32, "elapsed_time": "0:26:26", "remaining_time": "1:10:20"}
{"current_steps": 60, "total_steps": 183, "loss": 0.4052, "learning_rate": 5e-06, "epoch": 0.9696969696969697, "percentage": 32.79, "elapsed_time": "0:31:43", "remaining_time": "1:05:02"}
{"current_steps": 61, "total_steps": 183, "eval_loss": 0.41120877861976624, "epoch": 0.9858585858585859, "percentage": 33.33, "elapsed_time": "0:33:25", "remaining_time": "1:06:51"}
{"current_steps": 70, "total_steps": 183, "loss": 0.3938, "learning_rate": 5e-06, "epoch": 1.1313131313131313, "percentage": 38.25, "elapsed_time": "0:38:51", "remaining_time": "1:02:43"}
{"current_steps": 80, "total_steps": 183, "loss": 0.3746, "learning_rate": 5e-06, "epoch": 1.2929292929292928, "percentage": 43.72, "elapsed_time": "0:44:07", "remaining_time": "0:56:48"}
{"current_steps": 90, "total_steps": 183, "loss": 0.3748, "learning_rate": 5e-06, "epoch": 1.4545454545454546, "percentage": 49.18, "elapsed_time": "0:49:21", "remaining_time": "0:51:00"}
{"current_steps": 100, "total_steps": 183, "loss": 0.3751, "learning_rate": 5e-06, "epoch": 1.6161616161616161, "percentage": 54.64, "elapsed_time": "0:54:38", "remaining_time": "0:45:20"}
{"current_steps": 110, "total_steps": 183, "loss": 0.3737, "learning_rate": 5e-06, "epoch": 1.7777777777777777, "percentage": 60.11, "elapsed_time": "0:59:53", "remaining_time": "0:39:44"}
{"current_steps": 120, "total_steps": 183, "loss": 0.3753, "learning_rate": 5e-06, "epoch": 1.9393939393939394, "percentage": 65.57, "elapsed_time": "1:05:08", "remaining_time": "0:34:11"}
{"current_steps": 123, "total_steps": 183, "eval_loss": 0.3987608253955841, "epoch": 1.9878787878787878, "percentage": 67.21, "elapsed_time": "1:07:45", "remaining_time": "0:33:03"}
{"current_steps": 130, "total_steps": 183, "loss": 0.36, "learning_rate": 5e-06, "epoch": 2.101010101010101, "percentage": 71.04, "elapsed_time": "1:12:06", "remaining_time": "0:29:23"}
{"current_steps": 140, "total_steps": 183, "loss": 0.3487, "learning_rate": 5e-06, "epoch": 2.2626262626262625, "percentage": 76.5, "elapsed_time": "1:17:21", "remaining_time": "0:23:45"}
{"current_steps": 150, "total_steps": 183, "loss": 0.348, "learning_rate": 5e-06, "epoch": 2.4242424242424243, "percentage": 81.97, "elapsed_time": "1:22:37", "remaining_time": "0:18:10"}
{"current_steps": 160, "total_steps": 183, "loss": 0.3508, "learning_rate": 5e-06, "epoch": 2.5858585858585856, "percentage": 87.43, "elapsed_time": "1:27:51", "remaining_time": "0:12:37"}
{"current_steps": 170, "total_steps": 183, "loss": 0.3486, "learning_rate": 5e-06, "epoch": 2.7474747474747474, "percentage": 92.9, "elapsed_time": "1:33:08", "remaining_time": "0:07:07"}
{"current_steps": 180, "total_steps": 183, "loss": 0.3467, "learning_rate": 5e-06, "epoch": 2.909090909090909, "percentage": 98.36, "elapsed_time": "1:38:23", "remaining_time": "0:01:38"}
{"current_steps": 183, "total_steps": 183, "eval_loss": 0.3988819718360901, "epoch": 2.9575757575757575, "percentage": 100.0, "elapsed_time": "1:41:45", "remaining_time": "0:00:00"}
{"current_steps": 183, "total_steps": 183, "epoch": 2.9575757575757575, "percentage": 100.0, "elapsed_time": "1:42:44", "remaining_time": "0:00:00"}