| {"current_steps": 10, "total_steps": 336, "loss": 0.2512, "learning_rate": 2.9411764705882354e-05, "epoch": 0.08888888888888889, "percentage": 2.98, "elapsed_time": "0:04:48", "remaining_time": "2:36:49", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 20, "total_steps": 336, "loss": 0.0734, "learning_rate": 5.882352941176471e-05, "epoch": 0.17777777777777778, "percentage": 5.95, "elapsed_time": "0:09:09", "remaining_time": "2:24:41", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 30, "total_steps": 336, "loss": 0.088, "learning_rate": 8.823529411764706e-05, "epoch": 0.26666666666666666, "percentage": 8.93, "elapsed_time": "0:13:40", "remaining_time": "2:19:28", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 40, "total_steps": 336, "loss": 0.0807, "learning_rate": 9.990263847374976e-05, "epoch": 0.35555555555555557, "percentage": 11.9, "elapsed_time": "0:18:20", "remaining_time": "2:15:42", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 50, "total_steps": 336, "loss": 0.0409, "learning_rate": 9.930902394260747e-05, "epoch": 0.4444444444444444, "percentage": 14.88, "elapsed_time": "0:22:39", "remaining_time": "2:09:35", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 60, "total_steps": 336, "loss": 0.0688, "learning_rate": 9.818229479678158e-05, "epoch": 0.5333333333333333, "percentage": 17.86, "elapsed_time": "0:27:17", "remaining_time": "2:05:34", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 70, "total_steps": 336, "loss": 0.0957, "learning_rate": 9.653463289927411e-05, "epoch": 0.6222222222222222, "percentage": 20.83, "elapsed_time": "0:31:59", "remaining_time": "2:01:34", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 80, "total_steps": 336, "loss": 0.0597, "learning_rate": 9.438385228425938e-05, "epoch": 0.7111111111111111, "percentage": 23.81, "elapsed_time": "0:36:26", "remaining_time": "1:56:36", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 90, "total_steps": 336, "loss": 0.0597, "learning_rate": 9.175320655700406e-05, "epoch": 0.8, "percentage": 26.79, "elapsed_time": "0:40:55", "remaining_time": "1:51:51", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 100, "total_steps": 336, "loss": 0.0873, "learning_rate": 8.86711374827494e-05, "epoch": 0.8888888888888888, "percentage": 29.76, "elapsed_time": "0:45:50", "remaining_time": "1:48:11", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 110, "total_steps": 336, "loss": 0.081, "learning_rate": 8.517096748273951e-05, "epoch": 0.9777777777777777, "percentage": 32.74, "elapsed_time": "0:50:28", "remaining_time": "1:43:41", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 120, "total_steps": 336, "loss": 0.0815, "learning_rate": 8.129053936203687e-05, "epoch": 1.0666666666666667, "percentage": 35.71, "elapsed_time": "0:55:23", "remaining_time": "1:39:43", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 130, "total_steps": 336, "loss": 0.0279, "learning_rate": 7.707180716428237e-05, "epoch": 1.1555555555555554, "percentage": 38.69, "elapsed_time": "0:59:43", "remaining_time": "1:34:38", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 140, "total_steps": 336, "loss": 0.0281, "learning_rate": 7.256038257695687e-05, "epoch": 1.2444444444444445, "percentage": 41.67, "elapsed_time": "1:04:29", "remaining_time": "1:30:17", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 150, "total_steps": 336, "loss": 0.0337, "learning_rate": 6.780504179127734e-05, "epoch": 1.3333333333333333, "percentage": 44.64, "elapsed_time": "1:09:15", "remaining_time": "1:25:52", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 160, "total_steps": 336, "loss": 0.0279, "learning_rate": 6.28571981484123e-05, "epoch": 1.4222222222222223, "percentage": 47.62, "elapsed_time": "1:13:33", "remaining_time": "1:20:55", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 170, "total_steps": 336, "loss": 0.038, "learning_rate": 5.7770346273610254e-05, "epoch": 1.511111111111111, "percentage": 50.6, "elapsed_time": "1:18:15", "remaining_time": "1:16:24", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 180, "total_steps": 336, "loss": 0.0277, "learning_rate": 5.2599483708099016e-05, "epoch": 1.6, "percentage": 53.57, "elapsed_time": "1:22:54", "remaining_time": "1:11:51", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 190, "total_steps": 336, "loss": 0.0274, "learning_rate": 4.740051629190099e-05, "epoch": 1.6888888888888889, "percentage": 56.55, "elapsed_time": "1:27:16", "remaining_time": "1:07:04", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 200, "total_steps": 336, "loss": 0.0213, "learning_rate": 4.2229653726389765e-05, "epoch": 1.7777777777777777, "percentage": 59.52, "elapsed_time": "1:31:41", "remaining_time": "1:02:21", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 210, "total_steps": 336, "loss": 0.0229, "learning_rate": 3.714280185158771e-05, "epoch": 1.8666666666666667, "percentage": 62.5, "elapsed_time": "1:36:20", "remaining_time": "0:57:48", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 220, "total_steps": 336, "loss": 0.0241, "learning_rate": 3.219495820872265e-05, "epoch": 1.9555555555555557, "percentage": 65.48, "elapsed_time": "1:41:16", "remaining_time": "0:53:23", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 230, "total_steps": 336, "loss": 0.033, "learning_rate": 2.7439617423043145e-05, "epoch": 2.0444444444444443, "percentage": 68.45, "elapsed_time": "1:46:06", "remaining_time": "0:48:54", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 240, "total_steps": 336, "loss": 0.0076, "learning_rate": 2.2928192835717644e-05, "epoch": 2.1333333333333333, "percentage": 71.43, "elapsed_time": "1:50:23", "remaining_time": "0:44:09", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 250, "total_steps": 336, "loss": 0.0089, "learning_rate": 1.8709460637963123e-05, "epoch": 2.2222222222222223, "percentage": 74.4, "elapsed_time": "1:55:00", "remaining_time": "0:39:33", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 260, "total_steps": 336, "loss": 0.0099, "learning_rate": 1.4829032517260489e-05, "epoch": 2.311111111111111, "percentage": 77.38, "elapsed_time": "1:59:29", "remaining_time": "0:34:55", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 270, "total_steps": 336, "loss": 0.0116, "learning_rate": 1.132886251725061e-05, "epoch": 2.4, "percentage": 80.36, "elapsed_time": "2:04:14", "remaining_time": "0:30:22", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 280, "total_steps": 336, "loss": 0.0084, "learning_rate": 8.246793442995954e-06, "epoch": 2.488888888888889, "percentage": 83.33, "elapsed_time": "2:08:32", "remaining_time": "0:25:42", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 290, "total_steps": 336, "loss": 0.0116, "learning_rate": 5.616147715740611e-06, "epoch": 2.5777777777777775, "percentage": 86.31, "elapsed_time": "2:13:02", "remaining_time": "0:21:06", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 300, "total_steps": 336, "loss": 0.0099, "learning_rate": 3.465367100725908e-06, "epoch": 2.6666666666666665, "percentage": 89.29, "elapsed_time": "2:18:01", "remaining_time": "0:16:33", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 310, "total_steps": 336, "loss": 0.0089, "learning_rate": 1.8177052032184283e-06, "epoch": 2.7555555555555555, "percentage": 92.26, "elapsed_time": "2:22:33", "remaining_time": "0:11:57", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 320, "total_steps": 336, "loss": 0.0072, "learning_rate": 6.909760573925561e-07, "epoch": 2.8444444444444446, "percentage": 95.24, "elapsed_time": "2:26:57", "remaining_time": "0:07:20", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 330, "total_steps": 336, "loss": 0.0072, "learning_rate": 9.73615262502503e-08, "epoch": 2.9333333333333336, "percentage": 98.21, "elapsed_time": "2:31:37", "remaining_time": "0:02:45", "throughput": "0.00", "total_tokens": 0} |
| {"current_steps": 336, "total_steps": 336, "epoch": 2.986666666666667, "percentage": 100.0, "elapsed_time": "2:34:46", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0} |
|
|