ryanmarten commited on
Commit
8be2b92
·
verified ·
1 Parent(s): e9ba824

Training in progress, epoch 0

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a62f99f50a21734f8f1df654d9a8312a7bd3d0ad9c551f4b37e2f4e3b91b1466
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb5d7d3d1b58d34795b9a57cdbb586e3b89169154eece1f19e7c746ac9201447
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bd1cbaab3b47642d9aed11cccbacf59b6bb83a1fa22c44e269ee69d0bbc6f4a8
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12ef1cd4a6a4bbc48f2a8c5ed048d63317fbf75de734a3bafaa6aed6fa3ba725
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:334e6d8b0fc33f3c1f11dfc64aae4b71a4eca6003bdb196c35ea7f9ca2e3d8c6
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53b2fb80842898090414642236f7fabf33e5a627a3ded2a9e0cb9445ae71c7aa
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:db5c44d9e2bf0dd560620986b09b9235b51b56c963b90a139e937793c38a9538
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96fcc72042db9db5f772f8297da88861084d95dbcc00a0e60ac4288006877691
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -406,3 +406,185 @@
406
  {"current_steps": 158, "total_steps": 1230, "loss": 0.4187, "lr": 3.990142120595444e-05, "epoch": 0.64, "percentage": 12.85, "elapsed_time": "3:58:41", "remaining_time": "1 day, 2:59:28"}
407
  {"current_steps": 249, "total_steps": 1230, "loss": 0.3546, "lr": 3.873493415863256e-05, "epoch": 1.010126582278481, "percentage": 20.24, "elapsed_time": "6:10:55", "remaining_time": "1 day, 0:21:20"}
408
  {"current_steps": 159, "total_steps": 1230, "loss": 0.4257, "lr": 3.98957126299907e-05, "epoch": 0.6440506329113924, "percentage": 12.93, "elapsed_time": "4:00:12", "remaining_time": "1 day, 2:57:57"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
406
  {"current_steps": 158, "total_steps": 1230, "loss": 0.4187, "lr": 3.990142120595444e-05, "epoch": 0.64, "percentage": 12.85, "elapsed_time": "3:58:41", "remaining_time": "1 day, 2:59:28"}
407
  {"current_steps": 249, "total_steps": 1230, "loss": 0.3546, "lr": 3.873493415863256e-05, "epoch": 1.010126582278481, "percentage": 20.24, "elapsed_time": "6:10:55", "remaining_time": "1 day, 0:21:20"}
408
  {"current_steps": 159, "total_steps": 1230, "loss": 0.4257, "lr": 3.98957126299907e-05, "epoch": 0.6440506329113924, "percentage": 12.93, "elapsed_time": "4:00:12", "remaining_time": "1 day, 2:57:57"}
409
+ {"current_steps": 250, "total_steps": 1230, "loss": 0.3574, "lr": 3.871499275032111e-05, "epoch": 1.0141772151898734, "percentage": 20.33, "elapsed_time": "6:12:14", "remaining_time": "1 day, 0:19:11"}
410
+ {"current_steps": 160, "total_steps": 1230, "loss": 0.4388, "lr": 3.9889843816692596e-05, "epoch": 0.6481012658227848, "percentage": 13.01, "elapsed_time": "4:01:43", "remaining_time": "1 day, 2:56:28"}
411
+ {"current_steps": 251, "total_steps": 1230, "loss": 0.3434, "lr": 3.869490061403091e-05, "epoch": 1.0182278481012659, "percentage": 20.41, "elapsed_time": "6:13:39", "remaining_time": "1 day, 0:17:23"}
412
+ {"current_steps": 161, "total_steps": 1230, "loss": 0.4197, "lr": 3.9883814813326766e-05, "epoch": 0.6521518987341772, "percentage": 13.09, "elapsed_time": "4:02:49", "remaining_time": "1 day, 2:52:16"}
413
+ {"current_steps": 252, "total_steps": 1230, "loss": 0.3437, "lr": 3.867465791158124e-05, "epoch": 1.0222784810126582, "percentage": 20.49, "elapsed_time": "6:14:57", "remaining_time": "1 day, 0:15:11"}
414
+ {"current_steps": 162, "total_steps": 1230, "loss": 0.4339, "lr": 3.9877625668449956e-05, "epoch": 0.6562025316455696, "percentage": 13.17, "elapsed_time": "4:04:32", "remaining_time": "1 day, 2:52:11"}
415
+ {"current_steps": 253, "total_steps": 1230, "loss": 0.331, "lr": 3.865426480600407e-05, "epoch": 1.0263291139240507, "percentage": 20.57, "elapsed_time": "6:16:15", "remaining_time": "1 day, 0:12:58"}
416
+ {"current_steps": 163, "total_steps": 1230, "loss": 0.4212, "lr": 3.98712764319087e-05, "epoch": 0.660253164556962, "percentage": 13.25, "elapsed_time": "4:05:51", "remaining_time": "1 day, 2:49:21"}
417
+ {"current_steps": 254, "total_steps": 1230, "loss": 0.3585, "lr": 3.863372146154264e-05, "epoch": 1.030379746835443, "percentage": 20.65, "elapsed_time": "6:17:47", "remaining_time": "1 day, 0:11:40"}
418
+ {"current_steps": 164, "total_steps": 1230, "loss": 0.4527, "lr": 3.9864767154838864e-05, "epoch": 0.6643037974683544, "percentage": 13.33, "elapsed_time": "4:07:24", "remaining_time": "1 day, 2:48:06"}
419
+ {"current_steps": 255, "total_steps": 1230, "loss": 0.3454, "lr": 3.861302804365024e-05, "epoch": 1.0344303797468355, "percentage": 20.73, "elapsed_time": "6:19:03", "remaining_time": "1 day, 0:09:21"}
420
+ {"current_steps": 165, "total_steps": 1230, "loss": 0.435, "lr": 3.9858097889665277e-05, "epoch": 0.6683544303797468, "percentage": 13.41, "elapsed_time": "4:08:35", "remaining_time": "1 day, 2:44:35"}
421
+ {"current_steps": 256, "total_steps": 1230, "loss": 0.3457, "lr": 3.85921847189888e-05, "epoch": 1.0384810126582278, "percentage": 20.81, "elapsed_time": "6:20:25", "remaining_time": "1 day, 0:07:22"}
422
+ {"current_steps": 166, "total_steps": 1230, "loss": 0.43, "lr": 3.985126869010129e-05, "epoch": 0.6724050632911392, "percentage": 13.5, "elapsed_time": "4:09:56", "remaining_time": "1 day, 2:42:04"}
423
+ {"current_steps": 257, "total_steps": 1230, "loss": 0.3427, "lr": 3.85711916554276e-05, "epoch": 1.0425316455696203, "percentage": 20.89, "elapsed_time": "6:21:56", "remaining_time": "1 day, 0:06:01"}
424
+ {"current_steps": 167, "total_steps": 1230, "loss": 0.4426, "lr": 3.984427961114833e-05, "epoch": 0.6764556962025317, "percentage": 13.58, "elapsed_time": "4:11:19", "remaining_time": "1 day, 2:39:43"}
425
+ {"current_steps": 258, "total_steps": 1230, "loss": 0.3625, "lr": 3.85500490220419e-05, "epoch": 1.0465822784810126, "percentage": 20.98, "elapsed_time": "6:23:24", "remaining_time": "1 day, 0:04:29"}
426
+ {"current_steps": 168, "total_steps": 1230, "loss": 0.4138, "lr": 3.9837130709095475e-05, "epoch": 0.6805063291139241, "percentage": 13.66, "elapsed_time": "4:12:54", "remaining_time": "1 day, 2:38:42"}
427
+ {"current_steps": 259, "total_steps": 1230, "loss": 0.3385, "lr": 3.852875698911154e-05, "epoch": 1.0506329113924051, "percentage": 21.06, "elapsed_time": "6:24:40", "remaining_time": "1 day, 0:02:10"}
428
+ {"current_steps": 169, "total_steps": 1230, "loss": 0.4133, "lr": 3.982982204151901e-05, "epoch": 0.6845569620253165, "percentage": 13.74, "elapsed_time": "4:14:06", "remaining_time": "1 day, 2:35:18"}
429
+ {"current_steps": 260, "total_steps": 1230, "loss": 0.3394, "lr": 3.850731572811963e-05, "epoch": 1.0546835443037974, "percentage": 21.14, "elapsed_time": "6:26:00", "remaining_time": "1 day, 0:00:05"}
430
+ {"current_steps": 170, "total_steps": 1230, "loss": 0.406, "lr": 3.982235366728193e-05, "epoch": 0.6886075949367089, "percentage": 13.82, "elapsed_time": "4:15:27", "remaining_time": "1 day, 2:32:50"}
431
+ {"current_steps": 261, "total_steps": 1230, "loss": 0.343, "lr": 3.848572541175116e-05, "epoch": 1.05873417721519, "percentage": 21.22, "elapsed_time": "6:27:30", "remaining_time": "23:58:39"}
432
+ {"current_steps": 171, "total_steps": 1230, "loss": 0.4078, "lr": 3.9814725646533505e-05, "epoch": 0.6926582278481013, "percentage": 13.9, "elapsed_time": "4:16:45", "remaining_time": "1 day, 2:30:03"}
433
+ {"current_steps": 262, "total_steps": 1230, "loss": 0.3442, "lr": 3.846398621389154e-05, "epoch": 1.0627848101265822, "percentage": 21.3, "elapsed_time": "6:28:54", "remaining_time": "23:56:54"}
434
+ {"current_steps": 172, "total_steps": 1230, "loss": 0.4427, "lr": 3.9806938040708746e-05, "epoch": 0.6967088607594937, "percentage": 13.98, "elapsed_time": "4:18:14", "remaining_time": "1 day, 2:28:29"}
435
+ {"current_steps": 263, "total_steps": 1230, "loss": 0.3271, "lr": 3.84420983096253e-05, "epoch": 1.0668354430379747, "percentage": 21.38, "elapsed_time": "6:30:07", "remaining_time": "23:54:24"}
436
+ {"current_steps": 173, "total_steps": 1230, "loss": 0.4498, "lr": 3.9798990912527976e-05, "epoch": 0.7007594936708861, "percentage": 14.07, "elapsed_time": "4:20:01", "remaining_time": "1 day, 2:28:39"}
437
+ {"current_steps": 264, "total_steps": 1230, "loss": 0.3282, "lr": 3.8420061875234606e-05, "epoch": 1.070886075949367, "percentage": 21.46, "elapsed_time": "6:31:27", "remaining_time": "23:52:22"}
438
+ {"current_steps": 174, "total_steps": 1230, "loss": 0.4281, "lr": 3.979088432599627e-05, "epoch": 0.7048101265822785, "percentage": 14.15, "elapsed_time": "4:21:26", "remaining_time": "1 day, 2:26:40"}
439
+ {"current_steps": 265, "total_steps": 1230, "loss": 0.3279, "lr": 3.839787708819787e-05, "epoch": 1.0749367088607595, "percentage": 21.54, "elapsed_time": "6:32:43", "remaining_time": "23:50:05"}
440
+ {"current_steps": 175, "total_steps": 1230, "loss": 0.4096, "lr": 3.9782618346402964e-05, "epoch": 0.7088607594936709, "percentage": 14.23, "elapsed_time": "4:22:37", "remaining_time": "1 day, 2:23:16"}
441
+ {"current_steps": 266, "total_steps": 1230, "loss": 0.3359, "lr": 3.8375544127188325e-05, "epoch": 1.0789873417721518, "percentage": 21.63, "elapsed_time": "6:34:06", "remaining_time": "23:48:15"}
442
+ {"current_steps": 176, "total_steps": 1230, "loss": 0.4326, "lr": 3.977419304032111e-05, "epoch": 0.7129113924050633, "percentage": 14.31, "elapsed_time": "4:23:46", "remaining_time": "1 day, 2:19:39"}
443
+ {"current_steps": 267, "total_steps": 1230, "loss": 0.3208, "lr": 3.8353063172072564e-05, "epoch": 1.0830379746835443, "percentage": 21.71, "elapsed_time": "6:35:21", "remaining_time": "23:45:55"}
444
+ {"current_steps": 177, "total_steps": 1230, "loss": 0.4298, "lr": 3.976560847560697e-05, "epoch": 0.7169620253164557, "percentage": 14.39, "elapsed_time": "4:25:15", "remaining_time": "1 day, 2:18:02"}
445
+ {"current_steps": 268, "total_steps": 1230, "loss": 0.3418, "lr": 3.8330434403909105e-05, "epoch": 1.0870886075949366, "percentage": 21.79, "elapsed_time": "6:36:57", "remaining_time": "23:44:55"}
446
+ {"current_steps": 178, "total_steps": 1230, "loss": 0.4233, "lr": 3.9756864721399456e-05, "epoch": 0.7210126582278481, "percentage": 14.47, "elapsed_time": "4:26:25", "remaining_time": "1 day, 2:14:38"}
447
+ {"current_steps": 269, "total_steps": 1230, "loss": 0.3516, "lr": 3.8307658004946934e-05, "epoch": 1.0911392405063292, "percentage": 21.87, "elapsed_time": "6:38:12", "remaining_time": "23:42:34"}
448
+ {"current_steps": 179, "total_steps": 1230, "loss": 0.4118, "lr": 3.974796184811956e-05, "epoch": 0.7250632911392405, "percentage": 14.55, "elapsed_time": "4:27:43", "remaining_time": "1 day, 2:11:54"}
449
+ {"current_steps": 270, "total_steps": 1230, "loss": 0.3188, "lr": 3.8284734158624046e-05, "epoch": 1.0951898734177214, "percentage": 21.95, "elapsed_time": "6:39:24", "remaining_time": "23:40:05"}
450
+ {"current_steps": 180, "total_steps": 1230, "loss": 0.4444, "lr": 3.973889992746979e-05, "epoch": 0.7291139240506329, "percentage": 14.63, "elapsed_time": "4:29:17", "remaining_time": "1 day, 2:10:54"}
451
+ {"current_steps": 271, "total_steps": 1230, "loss": 0.3331, "lr": 3.826166304956594e-05, "epoch": 1.099240506329114, "percentage": 22.03, "elapsed_time": "6:40:56", "remaining_time": "23:38:48"}
452
+ {"current_steps": 181, "total_steps": 1230, "loss": 0.4172, "lr": 3.972967903243361e-05, "epoch": 0.7331645569620253, "percentage": 14.72, "elapsed_time": "4:30:40", "remaining_time": "1 day, 2:08:41"}
453
+ {"current_steps": 272, "total_steps": 1230, "loss": 0.3413, "lr": 3.8238444863584164e-05, "epoch": 1.1032911392405063, "percentage": 22.11, "elapsed_time": "6:42:30", "remaining_time": "23:37:38"}
454
+ {"current_steps": 182, "total_steps": 1230, "loss": 0.4329, "lr": 3.972029923727486e-05, "epoch": 0.7372151898734177, "percentage": 14.8, "elapsed_time": "4:32:01", "remaining_time": "1 day, 2:06:22"}
455
+ {"current_steps": 273, "total_steps": 1230, "loss": 0.3381, "lr": 3.821507978767479e-05, "epoch": 1.1073417721518988, "percentage": 22.2, "elapsed_time": "6:43:58", "remaining_time": "23:36:09"}
456
+ {"current_steps": 183, "total_steps": 1230, "loss": 0.4191, "lr": 3.971076061753709e-05, "epoch": 0.7412658227848101, "percentage": 14.88, "elapsed_time": "4:33:26", "remaining_time": "1 day, 2:04:29"}
457
+ {"current_steps": 274, "total_steps": 1230, "loss": 0.3163, "lr": 3.819156801001693e-05, "epoch": 1.111392405063291, "percentage": 22.28, "elapsed_time": "6:45:08", "remaining_time": "23:33:35"}
458
+ {"current_steps": 184, "total_steps": 1230, "loss": 0.4264, "lr": 3.9701063250043066e-05, "epoch": 0.7453164556962025, "percentage": 14.96, "elapsed_time": "4:34:52", "remaining_time": "1 day, 2:02:34"}
459
+ {"current_steps": 275, "total_steps": 1230, "loss": 0.322, "lr": 3.816790971997121e-05, "epoch": 1.1154430379746836, "percentage": 22.36, "elapsed_time": "6:46:16", "remaining_time": "23:30:53"}
460
+ {"current_steps": 185, "total_steps": 1230, "loss": 0.4003, "lr": 3.969120721289402e-05, "epoch": 0.7493670886075949, "percentage": 15.04, "elapsed_time": "4:36:08", "remaining_time": "1 day, 1:59:46"}
461
+ {"current_steps": 276, "total_steps": 1230, "loss": 0.3307, "lr": 3.8144105108078246e-05, "epoch": 1.1194936708860759, "percentage": 22.44, "elapsed_time": "6:47:33", "remaining_time": "23:28:45"}
462
+ {"current_steps": 186, "total_steps": 1230, "loss": 0.4078, "lr": 3.9681192585469146e-05, "epoch": 0.7534177215189873, "percentage": 15.12, "elapsed_time": "4:37:39", "remaining_time": "1 day, 1:58:27"}
463
+ {"current_steps": 277, "total_steps": 1230, "loss": 0.3656, "lr": 3.81201543660571e-05, "epoch": 1.1235443037974684, "percentage": 22.52, "elapsed_time": "6:49:09", "remaining_time": "23:27:41"}
464
+ {"current_steps": 187, "total_steps": 1230, "loss": 0.4259, "lr": 3.9671019448424865e-05, "epoch": 0.7574683544303797, "percentage": 15.2, "elapsed_time": "4:39:05", "remaining_time": "1 day, 1:56:36"}
465
+ {"current_steps": 278, "total_steps": 1230, "loss": 0.348, "lr": 3.809605768680377e-05, "epoch": 1.1275949367088607, "percentage": 22.6, "elapsed_time": "6:50:39", "remaining_time": "23:26:18"}
466
+ {"current_steps": 188, "total_steps": 1230, "loss": 0.4074, "lr": 3.966068788369422e-05, "epoch": 0.7615189873417721, "percentage": 15.28, "elapsed_time": "4:40:28", "remaining_time": "1 day, 1:54:32"}
467
+ {"current_steps": 279, "total_steps": 1230, "loss": 0.3231, "lr": 3.807181526438958e-05, "epoch": 1.1316455696202532, "percentage": 22.68, "elapsed_time": "6:52:10", "remaining_time": "23:24:55"}
468
+ {"current_steps": 189, "total_steps": 1230, "loss": 0.4163, "lr": 3.965019797448622e-05, "epoch": 0.7655696202531646, "percentage": 15.37, "elapsed_time": "4:41:39", "remaining_time": "1 day, 1:51:21"}
469
+ {"current_steps": 280, "total_steps": 1230, "loss": 0.3392, "lr": 3.8047427294059697e-05, "epoch": 1.1356962025316455, "percentage": 22.76, "elapsed_time": "6:53:21", "remaining_time": "23:22:28"}
470
+ {"current_steps": 190, "total_steps": 1230, "loss": 0.427, "lr": 3.963954980528515e-05, "epoch": 0.769620253164557, "percentage": 15.45, "elapsed_time": "4:43:06", "remaining_time": "1 day, 1:49:39"}
471
+ {"current_steps": 281, "total_steps": 1230, "loss": 0.3166, "lr": 3.802289397223145e-05, "epoch": 1.139746835443038, "percentage": 22.85, "elapsed_time": "6:54:34", "remaining_time": "23:20:08"}
472
+ {"current_steps": 191, "total_steps": 1230, "loss": 0.4212, "lr": 3.9628743461849905e-05, "epoch": 0.7736708860759494, "percentage": 15.53, "elapsed_time": "4:44:39", "remaining_time": "1 day, 1:48:27"}
473
+ {"current_steps": 282, "total_steps": 1230, "loss": 0.3383, "lr": 3.7998215496492854e-05, "epoch": 1.1437974683544303, "percentage": 22.93, "elapsed_time": "6:56:16", "remaining_time": "23:19:22"}
474
+ {"current_steps": 192, "total_steps": 1230, "loss": 0.4223, "lr": 3.961777903121329e-05, "epoch": 0.7777215189873418, "percentage": 15.61, "elapsed_time": "4:46:00", "remaining_time": "1 day, 1:46:13"}
475
+ {"current_steps": 283, "total_steps": 1230, "loss": 0.343, "lr": 3.797339206560096e-05, "epoch": 1.1478481012658228, "percentage": 23.01, "elapsed_time": "6:57:50", "remaining_time": "23:18:14"}
476
+ {"current_steps": 193, "total_steps": 1230, "loss": 0.4185, "lr": 3.960665660168131e-05, "epoch": 0.7817721518987342, "percentage": 15.69, "elapsed_time": "4:47:26", "remaining_time": "1 day, 1:44:24"}
477
+ {"current_steps": 284, "total_steps": 1230, "loss": 0.3316, "lr": 3.794842387948027e-05, "epoch": 1.1518987341772151, "percentage": 23.09, "elapsed_time": "6:59:06", "remaining_time": "23:16:02"}
478
+ {"current_steps": 194, "total_steps": 1230, "loss": 0.4147, "lr": 3.9595376262832485e-05, "epoch": 0.7858227848101266, "percentage": 15.77, "elapsed_time": "4:48:55", "remaining_time": "1 day, 1:42:54"}
479
+ {"current_steps": 285, "total_steps": 1230, "loss": 0.3522, "lr": 3.7923311139221114e-05, "epoch": 1.1559493670886076, "percentage": 23.17, "elapsed_time": "7:00:27", "remaining_time": "23:14:10"}
480
+ {"current_steps": 195, "total_steps": 1230, "loss": 0.4427, "lr": 3.9583938105517127e-05, "epoch": 0.789873417721519, "percentage": 15.85, "elapsed_time": "4:50:27", "remaining_time": "1 day, 1:41:41"}
481
+ {"current_steps": 286, "total_steps": 1230, "loss": 0.3518, "lr": 3.7898054047078054e-05, "epoch": 1.16, "percentage": 23.25, "elapsed_time": "7:01:54", "remaining_time": "23:12:34"}
482
+ {"current_steps": 196, "total_steps": 1230, "loss": 0.4154, "lr": 3.957234222185657e-05, "epoch": 0.7939240506329114, "percentage": 15.93, "elapsed_time": "4:51:31", "remaining_time": "1 day, 1:37:55"}
483
+ {"current_steps": 287, "total_steps": 1230, "loss": 0.3456, "lr": 3.787265280646825e-05, "epoch": 1.1640506329113924, "percentage": 23.33, "elapsed_time": "7:03:23", "remaining_time": "23:11:09"}
484
+ {"current_steps": 197, "total_steps": 1230, "loss": 0.4325, "lr": 3.9560588705242474e-05, "epoch": 0.7979746835443038, "percentage": 16.02, "elapsed_time": "4:52:57", "remaining_time": "1 day, 1:36:08"}
485
+ {"current_steps": 288, "total_steps": 1230, "loss": 0.3455, "lr": 3.7847107621969786e-05, "epoch": 1.1681012658227847, "percentage": 23.41, "elapsed_time": "7:04:43", "remaining_time": "23:09:11"}
486
+ {"current_steps": 198, "total_steps": 1230, "loss": 0.4294, "lr": 3.954867765033605e-05, "epoch": 0.8020253164556962, "percentage": 16.1, "elapsed_time": "4:54:24", "remaining_time": "1 day, 1:34:30"}
487
+ {"current_steps": 289, "total_steps": 1230, "loss": 0.339, "lr": 3.7821418699320064e-05, "epoch": 1.1721518987341772, "percentage": 23.5, "elapsed_time": "7:06:03", "remaining_time": "23:07:17"}
488
+ {"current_steps": 199, "total_steps": 1230, "loss": 0.4488, "lr": 3.953660915306728e-05, "epoch": 0.8060759493670886, "percentage": 16.18, "elapsed_time": "4:55:46", "remaining_time": "1 day, 1:32:22"}
489
+ {"current_steps": 290, "total_steps": 1230, "loss": 0.3417, "lr": 3.7795586245414145e-05, "epoch": 1.1762025316455695, "percentage": 23.58, "elapsed_time": "7:07:16", "remaining_time": "23:04:58"}
490
+ {"current_steps": 200, "total_steps": 1230, "loss": 0.4483, "lr": 3.952438331063419e-05, "epoch": 0.810126582278481, "percentage": 16.26, "elapsed_time": "4:57:12", "remaining_time": "1 day, 1:30:39"}
491
+ {"current_steps": 291, "total_steps": 1230, "loss": 0.3435, "lr": 3.776961046830306e-05, "epoch": 1.180253164556962, "percentage": 23.66, "elapsed_time": "7:08:35", "remaining_time": "23:02:59"}
492
+ {"current_steps": 201, "total_steps": 1230, "loss": 0.4265, "lr": 3.951200022150205e-05, "epoch": 0.8141772151898734, "percentage": 16.34, "elapsed_time": "4:58:26", "remaining_time": "1 day, 1:27:50"}
493
+ {"current_steps": 292, "total_steps": 1230, "loss": 0.3279, "lr": 3.774349157719215e-05, "epoch": 1.1843037974683543, "percentage": 23.74, "elapsed_time": "7:09:46", "remaining_time": "23:00:35"}
494
+ {"current_steps": 202, "total_steps": 1230, "loss": 0.4062, "lr": 3.949945998540253e-05, "epoch": 0.8182278481012658, "percentage": 16.42, "elapsed_time": "4:59:55", "remaining_time": "1 day, 1:26:23"}
495
+ {"current_steps": 293, "total_steps": 1230, "loss": 0.3268, "lr": 3.7717229782439365e-05, "epoch": 1.1883544303797469, "percentage": 23.82, "elapsed_time": "7:11:13", "remaining_time": "22:59:00"}
496
+ {"current_steps": 203, "total_steps": 1230, "loss": 0.419, "lr": 3.9486762703332993e-05, "epoch": 0.8222784810126582, "percentage": 16.5, "elapsed_time": "5:01:02", "remaining_time": "1 day, 1:23:00"}
497
+ {"current_steps": 294, "total_steps": 1230, "loss": 0.3322, "lr": 3.769082529555359e-05, "epoch": 1.1924050632911392, "percentage": 23.9, "elapsed_time": "7:12:36", "remaining_time": "22:57:16"}
498
+ {"current_steps": 204, "total_steps": 1230, "loss": 0.4312, "lr": 3.947390847755559e-05, "epoch": 0.8263291139240506, "percentage": 16.59, "elapsed_time": "5:02:25", "remaining_time": "1 day, 1:21:01"}
499
+ {"current_steps": 295, "total_steps": 1230, "loss": 0.3567, "lr": 3.766427832919294e-05, "epoch": 1.1964556962025317, "percentage": 23.98, "elapsed_time": "7:14:10", "remaining_time": "22:56:06"}
500
+ {"current_steps": 205, "total_steps": 1230, "loss": 0.4375, "lr": 3.946089741159648e-05, "epoch": 0.830379746835443, "percentage": 16.67, "elapsed_time": "5:04:01", "remaining_time": "1 day, 1:20:06"}
501
+ {"current_steps": 296, "total_steps": 1230, "loss": 0.3332, "lr": 3.7637589097163024e-05, "epoch": 1.200506329113924, "percentage": 24.07, "elapsed_time": "7:15:30", "remaining_time": "22:54:12"}
502
+ {"current_steps": 206, "total_steps": 1230, "loss": 0.407, "lr": 3.944772961024501e-05, "epoch": 0.8344303797468354, "percentage": 16.75, "elapsed_time": "5:05:23", "remaining_time": "1 day, 1:18:02"}
503
+ {"current_steps": 297, "total_steps": 1230, "loss": 0.3475, "lr": 3.761075781441526e-05, "epoch": 1.2045569620253165, "percentage": 24.15, "elapsed_time": "7:16:48", "remaining_time": "22:52:12"}
504
+ {"current_steps": 207, "total_steps": 1230, "loss": 0.4144, "lr": 3.943440517955285e-05, "epoch": 0.8384810126582278, "percentage": 16.83, "elapsed_time": "5:06:39", "remaining_time": "1 day, 1:15:29"}
505
+ {"current_steps": 298, "total_steps": 1230, "loss": 0.338, "lr": 3.75837846970451e-05, "epoch": 1.2086075949367088, "percentage": 24.23, "elapsed_time": "7:18:13", "remaining_time": "22:50:32"}
506
+ {"current_steps": 208, "total_steps": 1230, "loss": 0.4, "lr": 3.9420924226833126e-05, "epoch": 0.8425316455696202, "percentage": 16.91, "elapsed_time": "5:08:09", "remaining_time": "1 day, 1:14:06"}
507
+ {"current_steps": 299, "total_steps": 1230, "loss": 0.3479, "lr": 3.755666996229032e-05, "epoch": 1.2126582278481013, "percentage": 24.31, "elapsed_time": "7:19:36", "remaining_time": "22:48:47"}
508
+ {"current_steps": 209, "total_steps": 1230, "loss": 0.426, "lr": 3.9407286860659566e-05, "epoch": 0.8465822784810126, "percentage": 16.99, "elapsed_time": "5:09:25", "remaining_time": "1 day, 1:11:35"}
509
+ {"current_steps": 300, "total_steps": 1230, "loss": 0.3351, "lr": 3.752941382852927e-05, "epoch": 1.2167088607594936, "percentage": 24.39, "elapsed_time": "7:20:46", "remaining_time": "22:46:25"}
510
+ {"current_steps": 301, "total_steps": 1230, "loss": 0.3318, "lr": 3.7502016515279115e-05, "epoch": 1.220759493670886, "percentage": 24.47, "elapsed_time": "7:22:03", "remaining_time": "22:44:21"}
511
+ {"current_steps": 210, "total_steps": 1230, "loss": 0.4249, "lr": 3.9393493190865657e-05, "epoch": 0.850632911392405, "percentage": 17.07, "elapsed_time": "5:10:57", "remaining_time": "1 day, 1:10:24"}
512
+ {"current_steps": 302, "total_steps": 1230, "loss": 0.3607, "lr": 3.7474478243194043e-05, "epoch": 1.2248101265822784, "percentage": 24.55, "elapsed_time": "7:23:31", "remaining_time": "22:42:53"}
513
+ {"current_steps": 211, "total_steps": 1230, "loss": 0.4164, "lr": 3.937954332854371e-05, "epoch": 0.8546835443037974, "percentage": 17.15, "elapsed_time": "5:12:27", "remaining_time": "1 day, 1:08:56"}
514
+ {"current_steps": 303, "total_steps": 1230, "loss": 0.3401, "lr": 3.744679923406351e-05, "epoch": 1.228860759493671, "percentage": 24.63, "elapsed_time": "7:24:56", "remaining_time": "22:41:16"}
515
+ {"current_steps": 212, "total_steps": 1230, "loss": 0.4259, "lr": 3.9365437386044016e-05, "epoch": 0.8587341772151899, "percentage": 17.24, "elapsed_time": "5:13:50", "remaining_time": "1 day, 1:07:00"}
516
+ {"current_steps": 213, "total_steps": 1230, "loss": 0.4079, "lr": 3.935117547697387e-05, "epoch": 0.8627848101265823, "percentage": 17.32, "elapsed_time": "5:15:11", "remaining_time": "1 day, 1:04:53"}
517
+ {"current_steps": 304, "total_steps": 1230, "loss": 0.3534, "lr": 3.741897971081043e-05, "epoch": 1.2329113924050632, "percentage": 24.72, "elapsed_time": "7:26:20", "remaining_time": "22:39:33"}
518
+ {"current_steps": 305, "total_steps": 1230, "loss": 0.3313, "lr": 3.739101989748946e-05, "epoch": 1.2369620253164557, "percentage": 24.8, "elapsed_time": "7:27:44", "remaining_time": "22:37:53"}
519
+ {"current_steps": 214, "total_steps": 1230, "loss": 0.4052, "lr": 3.933675771619675e-05, "epoch": 0.8668354430379747, "percentage": 17.4, "elapsed_time": "5:16:36", "remaining_time": "1 day, 1:03:08"}
520
+ {"current_steps": 215, "total_steps": 1230, "loss": 0.4111, "lr": 3.932218421983131e-05, "epoch": 0.8708860759493671, "percentage": 17.48, "elapsed_time": "5:18:01", "remaining_time": "1 day, 1:01:21"}
521
+ {"current_steps": 306, "total_steps": 1230, "loss": 0.3536, "lr": 3.7362920019285066e-05, "epoch": 1.241012658227848, "percentage": 24.88, "elapsed_time": "7:29:27", "remaining_time": "22:37:11"}
522
+ {"current_steps": 216, "total_steps": 1230, "loss": 0.4185, "lr": 3.9307455105250484e-05, "epoch": 0.8749367088607595, "percentage": 17.56, "elapsed_time": "5:19:33", "remaining_time": "1 day, 1:00:08"}
523
+ {"current_steps": 307, "total_steps": 1230, "loss": 0.3257, "lr": 3.73346803025098e-05, "epoch": 1.2450632911392405, "percentage": 24.96, "elapsed_time": "7:30:47", "remaining_time": "22:35:17"}
524
+ {"current_steps": 308, "total_steps": 1230, "loss": 0.3373, "lr": 3.730630097460247e-05, "epoch": 1.2491139240506328, "percentage": 25.04, "elapsed_time": "7:32:01", "remaining_time": "22:33:08"}
525
+ {"current_steps": 217, "total_steps": 1230, "loss": 0.4063, "lr": 3.929257049108054e-05, "epoch": 0.8789873417721519, "percentage": 17.64, "elapsed_time": "5:20:53", "remaining_time": "1 day, 0:57:57"}
526
+ {"current_steps": 309, "total_steps": 1230, "loss": 0.3443, "lr": 3.727778226412628e-05, "epoch": 1.2531645569620253, "percentage": 25.12, "elapsed_time": "7:33:23", "remaining_time": "22:31:23"}
527
+ {"current_steps": 218, "total_steps": 1230, "loss": 0.432, "lr": 3.927753049720011e-05, "epoch": 0.8830379746835443, "percentage": 17.72, "elapsed_time": "5:22:23", "remaining_time": "1 day, 0:56:34"}
528
+ {"current_steps": 310, "total_steps": 1230, "loss": 0.3423, "lr": 3.7249124400767006e-05, "epoch": 1.2572151898734178, "percentage": 25.2, "elapsed_time": "7:34:56", "remaining_time": "22:30:08"}
529
+ {"current_steps": 219, "total_steps": 1230, "loss": 0.4165, "lr": 3.9262335244739234e-05, "epoch": 0.8870886075949367, "percentage": 17.8, "elapsed_time": "5:23:49", "remaining_time": "1 day, 0:54:56"}
530
+ {"current_steps": 220, "total_steps": 1230, "loss": 0.4144, "lr": 3.92469848560784e-05, "epoch": 0.8911392405063291, "percentage": 17.89, "elapsed_time": "5:25:02", "remaining_time": "1 day, 0:52:15"}
531
+ {"current_steps": 311, "total_steps": 1230, "loss": 0.3322, "lr": 3.722032761533114e-05, "epoch": 1.2612658227848101, "percentage": 25.28, "elapsed_time": "7:36:21", "remaining_time": "22:28:31"}
532
+ {"current_steps": 221, "total_steps": 1230, "loss": 0.4165, "lr": 3.923147945484751e-05, "epoch": 0.8951898734177215, "percentage": 17.97, "elapsed_time": "5:26:22", "remaining_time": "1 day, 0:50:04"}
533
+ {"current_steps": 312, "total_steps": 1230, "loss": 0.3569, "lr": 3.719139213974403e-05, "epoch": 1.2653164556962024, "percentage": 25.37, "elapsed_time": "7:37:46", "remaining_time": "22:26:54"}
534
+ {"current_steps": 222, "total_steps": 1230, "loss": 0.3999, "lr": 3.9215819165924956e-05, "epoch": 0.8992405063291139, "percentage": 18.05, "elapsed_time": "5:27:49", "remaining_time": "1 day, 0:48:29"}
535
+ {"current_steps": 313, "total_steps": 1230, "loss": 0.3229, "lr": 3.7162318207048006e-05, "epoch": 1.269367088607595, "percentage": 25.45, "elapsed_time": "7:39:02", "remaining_time": "22:24:50"}
536
+ {"current_steps": 223, "total_steps": 1230, "loss": 0.3956, "lr": 3.920000411543654e-05, "epoch": 0.9032911392405063, "percentage": 18.13, "elapsed_time": "5:29:02", "remaining_time": "1 day, 0:45:49"}
537
+ {"current_steps": 314, "total_steps": 1230, "loss": 0.3477, "lr": 3.713310605140055e-05, "epoch": 1.2734177215189875, "percentage": 25.53, "elapsed_time": "7:40:21", "remaining_time": "22:22:57"}
538
+ {"current_steps": 315, "total_steps": 1230, "loss": 0.3443, "lr": 3.710375590807233e-05, "epoch": 1.2774683544303798, "percentage": 25.61, "elapsed_time": "7:41:36", "remaining_time": "22:20:50"}
539
+ {"current_steps": 224, "total_steps": 1230, "loss": 0.4166, "lr": 3.9184034430754495e-05, "epoch": 0.9073417721518987, "percentage": 18.21, "elapsed_time": "5:30:30", "remaining_time": "1 day, 0:44:19"}
540
+ {"current_steps": 225, "total_steps": 1230, "loss": 0.4191, "lr": 3.916791024049648e-05, "epoch": 0.9113924050632911, "percentage": 18.29, "elapsed_time": "5:31:50", "remaining_time": "1 day, 0:42:15"}
541
+ {"current_steps": 316, "total_steps": 1230, "loss": 0.3414, "lr": 3.7074268013445365e-05, "epoch": 1.281518987341772, "percentage": 25.69, "elapsed_time": "7:43:00", "remaining_time": "22:19:12"}
542
+ {"current_steps": 317, "total_steps": 1230, "loss": 0.3305, "lr": 3.7044642605011114e-05, "epoch": 1.2855696202531646, "percentage": 25.77, "elapsed_time": "7:44:09", "remaining_time": "22:16:49"}
543
+ {"current_steps": 226, "total_steps": 1230, "loss": 0.4092, "lr": 3.91516316745245e-05, "epoch": 0.9154430379746835, "percentage": 18.37, "elapsed_time": "5:33:16", "remaining_time": "1 day, 0:40:35"}
544
+ {"current_steps": 318, "total_steps": 1230, "loss": 0.3483, "lr": 3.701487992136854e-05, "epoch": 1.289620253164557, "percentage": 25.85, "elapsed_time": "7:45:33", "remaining_time": "22:15:11"}
545
+ {"current_steps": 227, "total_steps": 1230, "loss": 0.4078, "lr": 3.913519886394389e-05, "epoch": 0.9194936708860759, "percentage": 18.46, "elapsed_time": "5:34:34", "remaining_time": "1 day, 0:38:21"}
546
+ {"current_steps": 319, "total_steps": 1230, "loss": 0.3483, "lr": 3.69849802022222e-05, "epoch": 1.2936708860759494, "percentage": 25.93, "elapsed_time": "7:46:51", "remaining_time": "22:13:14"}
547
+ {"current_steps": 228, "total_steps": 1230, "loss": 0.4153, "lr": 3.911861194110225e-05, "epoch": 0.9235443037974683, "percentage": 18.54, "elapsed_time": "5:35:53", "remaining_time": "1 day, 0:36:11"}
548
+ {"current_steps": 320, "total_steps": 1230, "loss": 0.3465, "lr": 3.6954943688380334e-05, "epoch": 1.2977215189873417, "percentage": 26.02, "elapsed_time": "7:48:24", "remaining_time": "22:12:00"}
549
+ {"current_steps": 229, "total_steps": 1230, "loss": 0.406, "lr": 3.910187103958837e-05, "epoch": 0.9275949367088607, "percentage": 18.62, "elapsed_time": "5:37:15", "remaining_time": "1 day, 0:34:13"}
550
+ {"current_steps": 321, "total_steps": 1230, "loss": 0.3396, "lr": 3.692477062175289e-05, "epoch": 1.3017721518987342, "percentage": 26.1, "elapsed_time": "7:49:53", "remaining_time": "22:10:36"}
551
+ {"current_steps": 230, "total_steps": 1230, "loss": 0.4173, "lr": 3.908497629423117e-05, "epoch": 0.9316455696202531, "percentage": 18.7, "elapsed_time": "5:38:47", "remaining_time": "1 day, 0:33:00"}
552
+ {"current_steps": 322, "total_steps": 1230, "loss": 0.3492, "lr": 3.689446124534958e-05, "epoch": 1.3058227848101267, "percentage": 26.18, "elapsed_time": "7:51:11", "remaining_time": "22:08:42"}
553
+ {"current_steps": 231, "total_steps": 1230, "loss": 0.4185, "lr": 3.9067927841098614e-05, "epoch": 0.9356962025316455, "percentage": 18.78, "elapsed_time": "5:40:13", "remaining_time": "1 day, 0:31:20"}
554
+ {"current_steps": 232, "total_steps": 1230, "loss": 0.4003, "lr": 3.9050725817496594e-05, "epoch": 0.9397468354430379, "percentage": 18.86, "elapsed_time": "5:41:30", "remaining_time": "1 day, 0:29:04"}
555
+ {"current_steps": 323, "total_steps": 1230, "loss": 0.3445, "lr": 3.686401580327799e-05, "epoch": 1.309873417721519, "percentage": 26.26, "elapsed_time": "7:52:46", "remaining_time": "22:07:34"}
556
+ {"current_steps": 324, "total_steps": 1230, "loss": 0.3336, "lr": 3.683343454074149e-05, "epoch": 1.3139240506329113, "percentage": 26.34, "elapsed_time": "7:54:03", "remaining_time": "22:05:35"}
557
+ {"current_steps": 233, "total_steps": 1230, "loss": 0.4225, "lr": 3.9033370361967844e-05, "epoch": 0.9437974683544303, "percentage": 18.94, "elapsed_time": "5:43:09", "remaining_time": "1 day, 0:28:19"}
558
+ {"current_steps": 325, "total_steps": 1230, "loss": 0.3431, "lr": 3.6802717704037386e-05, "epoch": 1.3179746835443038, "percentage": 26.42, "elapsed_time": "7:55:28", "remaining_time": "22:04:00"}
559
+ {"current_steps": 234, "total_steps": 1230, "loss": 0.4285, "lr": 3.901586161429081e-05, "epoch": 0.9478481012658228, "percentage": 19.02, "elapsed_time": "5:44:50", "remaining_time": "1 day, 0:27:48"}
560
+ {"current_steps": 326, "total_steps": 1230, "loss": 0.3306, "lr": 3.6771865540554855e-05, "epoch": 1.3220253164556963, "percentage": 26.5, "elapsed_time": "7:56:48", "remaining_time": "22:02:10"}
561
+ {"current_steps": 235, "total_steps": 1230, "loss": 0.4238, "lr": 3.8998199715478545e-05, "epoch": 0.9518987341772152, "percentage": 19.11, "elapsed_time": "5:46:16", "remaining_time": "1 day, 0:26:09"}
562
+ {"current_steps": 327, "total_steps": 1230, "loss": 0.3588, "lr": 3.674087829877297e-05, "epoch": 1.3260759493670886, "percentage": 26.59, "elapsed_time": "7:58:20", "remaining_time": "22:00:56"}
563
+ {"current_steps": 236, "total_steps": 1230, "loss": 0.4131, "lr": 3.8980384807777564e-05, "epoch": 0.9559493670886076, "percentage": 19.19, "elapsed_time": "5:47:39", "remaining_time": "1 day, 0:24:17"}
564
+ {"current_steps": 328, "total_steps": 1230, "loss": 0.3282, "lr": 3.6709756228258735e-05, "epoch": 1.330126582278481, "percentage": 26.67, "elapsed_time": "7:59:36", "remaining_time": "21:58:54"}
565
+ {"current_steps": 237, "total_steps": 1230, "loss": 0.4205, "lr": 3.896241703466667e-05, "epoch": 0.96, "percentage": 19.27, "elapsed_time": "5:49:04", "remaining_time": "1 day, 0:22:35"}
566
+ {"current_steps": 329, "total_steps": 1230, "loss": 0.3388, "lr": 3.667849957966501e-05, "epoch": 1.3341772151898734, "percentage": 26.75, "elapsed_time": "8:00:55", "remaining_time": "21:57:04"}
567
+ {"current_steps": 238, "total_steps": 1230, "loss": 0.4128, "lr": 3.894429654085585e-05, "epoch": 0.9640506329113924, "percentage": 19.35, "elapsed_time": "5:50:36", "remaining_time": "1 day, 0:21:21"}
568
+ {"current_steps": 330, "total_steps": 1230, "loss": 0.34, "lr": 3.6647108604728546e-05, "epoch": 1.338227848101266, "percentage": 26.83, "elapsed_time": "8:02:09", "remaining_time": "21:54:57"}
569
+ {"current_steps": 239, "total_steps": 1230, "loss": 0.4032, "lr": 3.892602347228505e-05, "epoch": 0.9681012658227848, "percentage": 19.43, "elapsed_time": "5:52:06", "remaining_time": "1 day, 0:19:58"}
570
+ {"current_steps": 331, "total_steps": 1230, "loss": 0.3397, "lr": 3.661558355626795e-05, "epoch": 1.3422784810126582, "percentage": 26.91, "elapsed_time": "8:03:38", "remaining_time": "21:53:35"}
571
+ {"current_steps": 240, "total_steps": 1230, "loss": 0.4068, "lr": 3.890759797612307e-05, "epoch": 0.9721518987341772, "percentage": 19.51, "elapsed_time": "5:53:11", "remaining_time": "1 day, 0:16:56"}
572
+ {"current_steps": 332, "total_steps": 1230, "loss": 0.3464, "lr": 3.658392468818163e-05, "epoch": 1.3463291139240505, "percentage": 26.99, "elapsed_time": "8:04:58", "remaining_time": "21:51:47"}
573
+ {"current_steps": 241, "total_steps": 1230, "loss": 0.42, "lr": 3.888902020076632e-05, "epoch": 0.9762025316455696, "percentage": 19.59, "elapsed_time": "5:54:33", "remaining_time": "1 day, 0:15:01"}
574
+ {"current_steps": 333, "total_steps": 1230, "loss": 0.3508, "lr": 3.655213225544574e-05, "epoch": 1.350379746835443, "percentage": 27.07, "elapsed_time": "8:06:27", "remaining_time": "21:50:22"}
575
+ {"current_steps": 242, "total_steps": 1230, "loss": 0.4204, "lr": 3.887029029583764e-05, "epoch": 0.980253164556962, "percentage": 19.67, "elapsed_time": "5:56:05", "remaining_time": "1 day, 0:13:47"}
576
+ {"current_steps": 334, "total_steps": 1230, "loss": 0.3366, "lr": 3.652020651411218e-05, "epoch": 1.3544303797468356, "percentage": 27.15, "elapsed_time": "8:07:51", "remaining_time": "21:48:45"}
577
+ {"current_steps": 243, "total_steps": 1230, "loss": 0.4252, "lr": 3.8851408412185125e-05, "epoch": 0.9843037974683544, "percentage": 19.76, "elapsed_time": "5:57:39", "remaining_time": "1 day, 0:12:43"}
578
+ {"current_steps": 335, "total_steps": 1230, "loss": 0.3463, "lr": 3.6488147721306474e-05, "epoch": 1.3584810126582278, "percentage": 27.24, "elapsed_time": "8:09:15", "remaining_time": "21:47:06"}
579
+ {"current_steps": 244, "total_steps": 1230, "loss": 0.4339, "lr": 3.8832374701880855e-05, "epoch": 0.9883544303797468, "percentage": 19.84, "elapsed_time": "5:58:55", "remaining_time": "1 day, 0:10:23"}
580
+ {"current_steps": 336, "total_steps": 1230, "loss": 0.3488, "lr": 3.645595613522574e-05, "epoch": 1.3625316455696201, "percentage": 27.32, "elapsed_time": "8:10:49", "remaining_time": "21:45:55"}
581
+ {"current_steps": 245, "total_steps": 1230, "loss": 0.4209, "lr": 3.881318931821972e-05, "epoch": 0.9924050632911392, "percentage": 19.92, "elapsed_time": "6:00:22", "remaining_time": "1 day, 0:08:51"}
582
+ {"current_steps": 337, "total_steps": 1230, "loss": 0.3363, "lr": 3.642363201513657e-05, "epoch": 1.3665822784810127, "percentage": 27.4, "elapsed_time": "8:12:05", "remaining_time": "21:43:56"}
583
+ {"current_steps": 246, "total_steps": 1230, "loss": 0.412, "lr": 3.879385241571817e-05, "epoch": 0.9964556962025316, "percentage": 20.0, "elapsed_time": "6:01:43", "remaining_time": "1 day, 0:06:54"}
584
+ {"current_steps": 338, "total_steps": 1230, "loss": 0.3328, "lr": 3.6391175621373006e-05, "epoch": 1.3706329113924052, "percentage": 27.48, "elapsed_time": "8:13:27", "remaining_time": "21:42:14"}
585
+ {"current_steps": 339, "total_steps": 1230, "loss": 0.3492, "lr": 3.6358587215334355e-05, "epoch": 1.3746835443037975, "percentage": 27.56, "elapsed_time": "8:14:48", "remaining_time": "21:40:29"}
586
+ {"current_steps": 247, "total_steps": 1230, "loss": 0.3742, "lr": 3.8774364150112955e-05, "epoch": 1.0020253164556963, "percentage": 20.08, "elapsed_time": "6:04:01", "remaining_time": "1 day, 0:08:42"}
587
+ {"current_steps": 340, "total_steps": 1230, "loss": 0.3265, "lr": 3.632586705948318e-05, "epoch": 1.3787341772151898, "percentage": 27.64, "elapsed_time": "8:16:10", "remaining_time": "21:38:49"}
588
+ {"current_steps": 248, "total_steps": 1230, "loss": 0.3582, "lr": 3.8754724678359884e-05, "epoch": 1.0060759493670886, "percentage": 20.16, "elapsed_time": "6:05:29", "remaining_time": "1 day, 0:07:14"}
589
+ {"current_steps": 341, "total_steps": 1230, "loss": 0.3391, "lr": 3.629301541734311e-05, "epoch": 1.3827848101265823, "percentage": 27.72, "elapsed_time": "8:17:39", "remaining_time": "21:37:25"}
590
+ {"current_steps": 249, "total_steps": 1230, "loss": 0.3548, "lr": 3.873493415863256e-05, "epoch": 1.010126582278481, "percentage": 20.24, "elapsed_time": "6:07:06", "remaining_time": "1 day, 0:06:17"}
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2b109346f835356baa84e067fdb9a82cdcae7d60dd3739e1d9b7b4e6b1eca559
3
  size 7288
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fbfe2753ce890402118e13912d3877e6acebdd7767919752be931aea1065b060
3
  size 7288