jdqqjr's picture
Upload folder using huggingface_hub
de29f71 verified
{"current_steps": 10, "total_steps": 500, "loss": 16.6271, "learning_rate": 9.996447363202946e-05, "epoch": 0.08, "percentage": 2.0, "elapsed_time": "0:00:24", "remaining_time": "0:19:39"}
{"current_steps": 20, "total_steps": 500, "loss": 13.6217, "learning_rate": 9.977809823015401e-05, "epoch": 0.16, "percentage": 4.0, "elapsed_time": "0:00:47", "remaining_time": "0:19:02"}
{"current_steps": 30, "total_steps": 500, "loss": 12.3656, "learning_rate": 9.938441702975689e-05, "epoch": 0.24, "percentage": 6.0, "elapsed_time": "0:01:11", "remaining_time": "0:18:33"}
{"current_steps": 40, "total_steps": 500, "loss": 12.2646, "learning_rate": 9.879583809693738e-05, "epoch": 0.32, "percentage": 8.0, "elapsed_time": "0:01:35", "remaining_time": "0:18:12"}
{"current_steps": 50, "total_steps": 500, "loss": 12.1808, "learning_rate": 9.801468428384716e-05, "epoch": 0.4, "percentage": 10.0, "elapsed_time": "0:01:58", "remaining_time": "0:17:49"}
{"current_steps": 60, "total_steps": 500, "loss": 12.1502, "learning_rate": 9.704403844771128e-05, "epoch": 0.48, "percentage": 12.0, "elapsed_time": "0:02:22", "remaining_time": "0:17:26"}
{"current_steps": 70, "total_steps": 500, "loss": 11.9683, "learning_rate": 9.588773128419906e-05, "epoch": 0.56, "percentage": 14.0, "elapsed_time": "0:02:46", "remaining_time": "0:17:05"}
{"current_steps": 80, "total_steps": 500, "loss": 11.8564, "learning_rate": 9.45503262094184e-05, "epoch": 0.64, "percentage": 16.0, "elapsed_time": "0:03:10", "remaining_time": "0:16:41"}
{"current_steps": 90, "total_steps": 500, "loss": 12.0212, "learning_rate": 9.30371013501972e-05, "epoch": 0.72, "percentage": 18.0, "elapsed_time": "0:03:35", "remaining_time": "0:16:20"}
{"current_steps": 100, "total_steps": 500, "loss": 11.8631, "learning_rate": 9.135402871372808e-05, "epoch": 0.8, "percentage": 20.0, "elapsed_time": "0:03:59", "remaining_time": "0:15:56"}
{"current_steps": 110, "total_steps": 500, "loss": 11.6954, "learning_rate": 8.950775061878453e-05, "epoch": 0.88, "percentage": 22.0, "elapsed_time": "0:04:23", "remaining_time": "0:15:33"}
{"current_steps": 120, "total_steps": 500, "loss": 11.7669, "learning_rate": 8.750555348152298e-05, "epoch": 0.96, "percentage": 24.0, "elapsed_time": "0:04:47", "remaining_time": "0:15:10"}
{"current_steps": 130, "total_steps": 500, "loss": 10.3003, "learning_rate": 8.535533905932738e-05, "epoch": 1.04, "percentage": 26.0, "elapsed_time": "0:05:11", "remaining_time": "0:14:46"}
{"current_steps": 140, "total_steps": 500, "loss": 8.5731, "learning_rate": 8.306559326618259e-05, "epoch": 1.12, "percentage": 28.0, "elapsed_time": "0:05:35", "remaining_time": "0:14:23"}
{"current_steps": 150, "total_steps": 500, "loss": 8.5948, "learning_rate": 8.064535268264883e-05, "epoch": 1.2, "percentage": 30.0, "elapsed_time": "0:06:00", "remaining_time": "0:14:00"}
{"current_steps": 160, "total_steps": 500, "loss": 8.656, "learning_rate": 7.810416889260653e-05, "epoch": 1.28, "percentage": 32.0, "elapsed_time": "0:06:24", "remaining_time": "0:13:37"}
{"current_steps": 170, "total_steps": 500, "loss": 8.7269, "learning_rate": 7.545207078751857e-05, "epoch": 1.3599999999999999, "percentage": 34.0, "elapsed_time": "0:06:49", "remaining_time": "0:13:14"}
{"current_steps": 180, "total_steps": 500, "loss": 8.6868, "learning_rate": 7.269952498697734e-05, "epoch": 1.44, "percentage": 36.0, "elapsed_time": "0:07:13", "remaining_time": "0:12:50"}
{"current_steps": 190, "total_steps": 500, "loss": 8.7702, "learning_rate": 6.985739453173903e-05, "epoch": 1.52, "percentage": 38.0, "elapsed_time": "0:07:37", "remaining_time": "0:12:26"}
{"current_steps": 200, "total_steps": 500, "loss": 8.7521, "learning_rate": 6.693689601226458e-05, "epoch": 1.6, "percentage": 40.0, "elapsed_time": "0:08:01", "remaining_time": "0:12:02"}
{"current_steps": 210, "total_steps": 500, "loss": 8.8742, "learning_rate": 6.394955530196147e-05, "epoch": 1.6800000000000002, "percentage": 42.0, "elapsed_time": "0:08:25", "remaining_time": "0:11:38"}
{"current_steps": 220, "total_steps": 500, "loss": 8.7707, "learning_rate": 6.090716206982714e-05, "epoch": 1.76, "percentage": 44.0, "elapsed_time": "0:08:49", "remaining_time": "0:11:14"}
{"current_steps": 230, "total_steps": 500, "loss": 8.7433, "learning_rate": 5.782172325201155e-05, "epoch": 1.8399999999999999, "percentage": 46.0, "elapsed_time": "0:09:13", "remaining_time": "0:10:50"}
{"current_steps": 240, "total_steps": 500, "loss": 8.7179, "learning_rate": 5.470541566592573e-05, "epoch": 1.92, "percentage": 48.0, "elapsed_time": "0:09:38", "remaining_time": "0:10:26"}
{"current_steps": 250, "total_steps": 500, "loss": 8.6486, "learning_rate": 5.157053795390642e-05, "epoch": 2.0, "percentage": 50.0, "elapsed_time": "0:10:02", "remaining_time": "0:10:02"}
{"current_steps": 260, "total_steps": 500, "loss": 5.591, "learning_rate": 4.8429462046093585e-05, "epoch": 2.08, "percentage": 52.0, "elapsed_time": "0:10:26", "remaining_time": "0:09:38"}
{"current_steps": 270, "total_steps": 500, "loss": 5.4084, "learning_rate": 4.529458433407429e-05, "epoch": 2.16, "percentage": 54.0, "elapsed_time": "0:10:50", "remaining_time": "0:09:14"}
{"current_steps": 280, "total_steps": 500, "loss": 5.3605, "learning_rate": 4.2178276747988446e-05, "epoch": 2.24, "percentage": 56.0, "elapsed_time": "0:11:14", "remaining_time": "0:08:50"}
{"current_steps": 290, "total_steps": 500, "loss": 5.3401, "learning_rate": 3.9092837930172884e-05, "epoch": 2.32, "percentage": 58.0, "elapsed_time": "0:11:39", "remaining_time": "0:08:26"}
{"current_steps": 300, "total_steps": 500, "loss": 5.3064, "learning_rate": 3.605044469803854e-05, "epoch": 2.4, "percentage": 60.0, "elapsed_time": "0:12:03", "remaining_time": "0:08:02"}
{"current_steps": 310, "total_steps": 500, "loss": 5.3187, "learning_rate": 3.3063103987735433e-05, "epoch": 2.48, "percentage": 62.0, "elapsed_time": "0:12:27", "remaining_time": "0:07:38"}
{"current_steps": 320, "total_steps": 500, "loss": 5.413, "learning_rate": 3.0142605468260978e-05, "epoch": 2.56, "percentage": 64.0, "elapsed_time": "0:12:52", "remaining_time": "0:07:14"}
{"current_steps": 330, "total_steps": 500, "loss": 5.2867, "learning_rate": 2.7300475013022663e-05, "epoch": 2.64, "percentage": 66.0, "elapsed_time": "0:13:16", "remaining_time": "0:06:50"}
{"current_steps": 340, "total_steps": 500, "loss": 5.3684, "learning_rate": 2.4547929212481435e-05, "epoch": 2.7199999999999998, "percentage": 68.0, "elapsed_time": "0:13:40", "remaining_time": "0:06:26"}
{"current_steps": 350, "total_steps": 500, "loss": 5.3484, "learning_rate": 2.1895831107393484e-05, "epoch": 2.8, "percentage": 70.0, "elapsed_time": "0:14:05", "remaining_time": "0:06:02"}
{"current_steps": 360, "total_steps": 500, "loss": 5.2971, "learning_rate": 1.9354647317351188e-05, "epoch": 2.88, "percentage": 72.0, "elapsed_time": "0:14:29", "remaining_time": "0:05:38"}
{"current_steps": 370, "total_steps": 500, "loss": 5.2595, "learning_rate": 1.6934406733817414e-05, "epoch": 2.96, "percentage": 74.0, "elapsed_time": "0:14:53", "remaining_time": "0:05:14"}
{"current_steps": 380, "total_steps": 500, "loss": 4.2182, "learning_rate": 1.4644660940672627e-05, "epoch": 3.04, "percentage": 76.0, "elapsed_time": "0:15:18", "remaining_time": "0:04:50"}
{"current_steps": 390, "total_steps": 500, "loss": 3.1071, "learning_rate": 1.2494446518477022e-05, "epoch": 3.12, "percentage": 78.0, "elapsed_time": "0:15:43", "remaining_time": "0:04:25"}
{"current_steps": 400, "total_steps": 500, "loss": 3.068, "learning_rate": 1.049224938121548e-05, "epoch": 3.2, "percentage": 80.0, "elapsed_time": "0:16:07", "remaining_time": "0:04:01"}
{"current_steps": 410, "total_steps": 500, "loss": 2.9727, "learning_rate": 8.645971286271904e-06, "epoch": 3.2800000000000002, "percentage": 82.0, "elapsed_time": "0:16:31", "remaining_time": "0:03:37"}
{"current_steps": 420, "total_steps": 500, "loss": 2.9938, "learning_rate": 6.962898649802823e-06, "epoch": 3.36, "percentage": 84.0, "elapsed_time": "0:16:55", "remaining_time": "0:03:13"}
{"current_steps": 430, "total_steps": 500, "loss": 3.0744, "learning_rate": 5.449673790581611e-06, "epoch": 3.44, "percentage": 86.0, "elapsed_time": "0:17:20", "remaining_time": "0:02:49"}
{"current_steps": 440, "total_steps": 500, "loss": 2.9339, "learning_rate": 4.112268715800943e-06, "epoch": 3.52, "percentage": 88.0, "elapsed_time": "0:17:44", "remaining_time": "0:02:25"}
{"current_steps": 450, "total_steps": 500, "loss": 2.9912, "learning_rate": 2.9559615522887273e-06, "epoch": 3.6, "percentage": 90.0, "elapsed_time": "0:18:09", "remaining_time": "0:02:01"}
{"current_steps": 460, "total_steps": 500, "loss": 2.9679, "learning_rate": 1.985315716152847e-06, "epoch": 3.68, "percentage": 92.0, "elapsed_time": "0:18:33", "remaining_time": "0:01:36"}
{"current_steps": 470, "total_steps": 500, "loss": 3.0297, "learning_rate": 1.2041619030626284e-06, "epoch": 3.76, "percentage": 94.0, "elapsed_time": "0:18:57", "remaining_time": "0:01:12"}
{"current_steps": 480, "total_steps": 500, "loss": 2.9479, "learning_rate": 6.15582970243117e-07, "epoch": 3.84, "percentage": 96.0, "elapsed_time": "0:19:22", "remaining_time": "0:00:48"}
{"current_steps": 490, "total_steps": 500, "loss": 3.0567, "learning_rate": 2.219017698460002e-07, "epoch": 3.92, "percentage": 98.0, "elapsed_time": "0:19:46", "remaining_time": "0:00:24"}
{"current_steps": 500, "total_steps": 500, "loss": 3.0452, "learning_rate": 2.467198171342e-08, "epoch": 4.0, "percentage": 100.0, "elapsed_time": "0:20:10", "remaining_time": "0:00:00"}
{"current_steps": 500, "total_steps": 500, "epoch": 4.0, "percentage": 100.0, "elapsed_time": "0:20:20", "remaining_time": "0:00:00"}