Training in progress, epoch 4
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5f110d3d71121f5e495f6c55757fa9c487f1a75f52925882460a7381e556e0ee
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7f418b286a99e3e0ce10a180af9d36a744f091cafbfd46824d7b02e93fa525dc
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e528875b60853e33a68e182cc6094fbb078c7365cf37d91a3e3e076cdf7a3899
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0d5e89de1ce2577df33aba6cf71e36b90e7b2eea555587da02a378993e8938b7
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -744,3 +744,250 @@
|
|
| 744 |
{"current_steps": 744, "total_steps": 1235, "loss": 0.1798, "lr": 1.642806717162757e-05, "epoch": 3.012151898734177, "percentage": 60.24, "elapsed_time": "4:42:04", "remaining_time": "3:06:09"}
|
| 745 |
{"current_steps": 745, "total_steps": 1235, "loss": 0.1797, "lr": 1.637243646233718e-05, "epoch": 3.0162025316455696, "percentage": 60.32, "elapsed_time": "4:42:25", "remaining_time": "3:05:45"}
|
| 746 |
{"current_steps": 746, "total_steps": 1235, "loss": 0.1723, "lr": 1.6316834758948174e-05, "epoch": 3.020253164556962, "percentage": 60.4, "elapsed_time": "4:42:48", "remaining_time": "3:05:22"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 744 |
{"current_steps": 744, "total_steps": 1235, "loss": 0.1798, "lr": 1.642806717162757e-05, "epoch": 3.012151898734177, "percentage": 60.24, "elapsed_time": "4:42:04", "remaining_time": "3:06:09"}
|
| 745 |
{"current_steps": 745, "total_steps": 1235, "loss": 0.1797, "lr": 1.637243646233718e-05, "epoch": 3.0162025316455696, "percentage": 60.32, "elapsed_time": "4:42:25", "remaining_time": "3:05:45"}
|
| 746 |
{"current_steps": 746, "total_steps": 1235, "loss": 0.1723, "lr": 1.6316834758948174e-05, "epoch": 3.020253164556962, "percentage": 60.4, "elapsed_time": "4:42:48", "remaining_time": "3:05:22"}
|
| 747 |
+
{"current_steps": 747, "total_steps": 1235, "loss": 0.1742, "lr": 1.6261262506050282e-05, "epoch": 3.0243037974683546, "percentage": 60.49, "elapsed_time": "4:43:10", "remaining_time": "3:04:59"}
|
| 748 |
+
{"current_steps": 748, "total_steps": 1235, "loss": 0.1711, "lr": 1.620572014799777e-05, "epoch": 3.0283544303797467, "percentage": 60.57, "elapsed_time": "4:43:32", "remaining_time": "3:04:36"}
|
| 749 |
+
{"current_steps": 749, "total_steps": 1235, "loss": 0.1635, "lr": 1.6150208128905857e-05, "epoch": 3.0324050632911392, "percentage": 60.65, "elapsed_time": "4:43:55", "remaining_time": "3:04:13"}
|
| 750 |
+
{"current_steps": 750, "total_steps": 1235, "loss": 0.1717, "lr": 1.6094726892647147e-05, "epoch": 3.0364556962025318, "percentage": 60.73, "elapsed_time": "4:44:17", "remaining_time": "3:03:50"}
|
| 751 |
+
{"current_steps": 751, "total_steps": 1235, "loss": 0.1762, "lr": 1.6039276882848135e-05, "epoch": 3.0405063291139243, "percentage": 60.81, "elapsed_time": "4:44:40", "remaining_time": "3:03:27"}
|
| 752 |
+
{"current_steps": 752, "total_steps": 1235, "loss": 0.1735, "lr": 1.5983858542885635e-05, "epoch": 3.0445569620253163, "percentage": 60.89, "elapsed_time": "4:45:01", "remaining_time": "3:03:04"}
|
| 753 |
+
{"current_steps": 753, "total_steps": 1235, "loss": 0.1754, "lr": 1.5928472315883203e-05, "epoch": 3.048607594936709, "percentage": 60.97, "elapsed_time": "4:45:24", "remaining_time": "3:02:41"}
|
| 754 |
+
{"current_steps": 754, "total_steps": 1235, "loss": 0.1822, "lr": 1.5873118644707633e-05, "epoch": 3.0526582278481014, "percentage": 61.05, "elapsed_time": "4:45:45", "remaining_time": "3:02:17"}
|
| 755 |
+
{"current_steps": 755, "total_steps": 1235, "loss": 0.1821, "lr": 1.5817797971965413e-05, "epoch": 3.056708860759494, "percentage": 61.13, "elapsed_time": "4:46:09", "remaining_time": "3:01:55"}
|
| 756 |
+
{"current_steps": 756, "total_steps": 1235, "loss": 0.1682, "lr": 1.576251073999917e-05, "epoch": 3.060759493670886, "percentage": 61.21, "elapsed_time": "4:46:30", "remaining_time": "3:01:31"}
|
| 757 |
+
{"current_steps": 757, "total_steps": 1235, "loss": 0.1638, "lr": 1.5707257390884126e-05, "epoch": 3.0648101265822785, "percentage": 61.3, "elapsed_time": "4:46:51", "remaining_time": "3:01:08"}
|
| 758 |
+
{"current_steps": 758, "total_steps": 1235, "loss": 0.1663, "lr": 1.5652038366424595e-05, "epoch": 3.068860759493671, "percentage": 61.38, "elapsed_time": "4:47:13", "remaining_time": "3:00:44"}
|
| 759 |
+
{"current_steps": 759, "total_steps": 1235, "loss": 0.1715, "lr": 1.5596854108150424e-05, "epoch": 3.0729113924050635, "percentage": 61.46, "elapsed_time": "4:47:35", "remaining_time": "3:00:21"}
|
| 760 |
+
{"current_steps": 760, "total_steps": 1235, "loss": 0.1712, "lr": 1.5541705057313476e-05, "epoch": 3.0769620253164556, "percentage": 61.54, "elapsed_time": "4:48:00", "remaining_time": "3:00:00"}
|
| 761 |
+
{"current_steps": 761, "total_steps": 1235, "loss": 0.1718, "lr": 1.5486591654884086e-05, "epoch": 3.081012658227848, "percentage": 61.62, "elapsed_time": "4:48:21", "remaining_time": "2:59:36"}
|
| 762 |
+
{"current_steps": 762, "total_steps": 1235, "loss": 0.1778, "lr": 1.543151434154755e-05, "epoch": 3.0850632911392406, "percentage": 61.7, "elapsed_time": "4:48:43", "remaining_time": "2:59:13"}
|
| 763 |
+
{"current_steps": 763, "total_steps": 1235, "loss": 0.1802, "lr": 1.5376473557700615e-05, "epoch": 3.089113924050633, "percentage": 61.78, "elapsed_time": "4:49:06", "remaining_time": "2:58:50"}
|
| 764 |
+
{"current_steps": 764, "total_steps": 1235, "loss": 0.1749, "lr": 1.5321469743447893e-05, "epoch": 3.093164556962025, "percentage": 61.86, "elapsed_time": "4:49:29", "remaining_time": "2:58:27"}
|
| 765 |
+
{"current_steps": 765, "total_steps": 1235, "loss": 0.1722, "lr": 1.5266503338598434e-05, "epoch": 3.0972151898734177, "percentage": 61.94, "elapsed_time": "4:49:50", "remaining_time": "2:58:04"}
|
| 766 |
+
{"current_steps": 766, "total_steps": 1235, "loss": 0.1728, "lr": 1.5211574782662149e-05, "epoch": 3.1012658227848102, "percentage": 62.02, "elapsed_time": "4:50:14", "remaining_time": "2:57:42"}
|
| 767 |
+
{"current_steps": 767, "total_steps": 1235, "loss": 0.1695, "lr": 1.5156684514846307e-05, "epoch": 3.1053164556962027, "percentage": 62.11, "elapsed_time": "4:50:36", "remaining_time": "2:57:19"}
|
| 768 |
+
{"current_steps": 768, "total_steps": 1235, "loss": 0.1809, "lr": 1.5101832974052012e-05, "epoch": 3.109367088607595, "percentage": 62.19, "elapsed_time": "4:50:58", "remaining_time": "2:56:56"}
|
| 769 |
+
{"current_steps": 769, "total_steps": 1235, "loss": 0.18, "lr": 1.5047020598870737e-05, "epoch": 3.1134177215189873, "percentage": 62.27, "elapsed_time": "4:51:20", "remaining_time": "2:56:33"}
|
| 770 |
+
{"current_steps": 770, "total_steps": 1235, "loss": 0.1779, "lr": 1.4992247827580778e-05, "epoch": 3.11746835443038, "percentage": 62.35, "elapsed_time": "4:51:42", "remaining_time": "2:56:09"}
|
| 771 |
+
{"current_steps": 771, "total_steps": 1235, "loss": 0.1772, "lr": 1.493751509814374e-05, "epoch": 3.1215189873417724, "percentage": 62.43, "elapsed_time": "4:52:04", "remaining_time": "2:55:46"}
|
| 772 |
+
{"current_steps": 772, "total_steps": 1235, "loss": 0.1714, "lr": 1.4882822848201073e-05, "epoch": 3.1255696202531644, "percentage": 62.51, "elapsed_time": "4:52:27", "remaining_time": "2:55:23"}
|
| 773 |
+
{"current_steps": 773, "total_steps": 1235, "loss": 0.1776, "lr": 1.4828171515070553e-05, "epoch": 3.129620253164557, "percentage": 62.59, "elapsed_time": "4:52:49", "remaining_time": "2:55:00"}
|
| 774 |
+
{"current_steps": 774, "total_steps": 1235, "loss": 0.1567, "lr": 1.4773561535742793e-05, "epoch": 3.1336708860759495, "percentage": 62.67, "elapsed_time": "4:53:12", "remaining_time": "2:54:38"}
|
| 775 |
+
{"current_steps": 775, "total_steps": 1235, "loss": 0.1734, "lr": 1.4718993346877715e-05, "epoch": 3.137721518987342, "percentage": 62.75, "elapsed_time": "4:53:33", "remaining_time": "2:54:14"}
|
| 776 |
+
{"current_steps": 776, "total_steps": 1235, "loss": 0.1625, "lr": 1.466446738480111e-05, "epoch": 3.141772151898734, "percentage": 62.83, "elapsed_time": "4:53:56", "remaining_time": "2:53:51"}
|
| 777 |
+
{"current_steps": 777, "total_steps": 1235, "loss": 0.1775, "lr": 1.460998408550112e-05, "epoch": 3.1458227848101266, "percentage": 62.91, "elapsed_time": "4:54:20", "remaining_time": "2:53:29"}
|
| 778 |
+
{"current_steps": 778, "total_steps": 1235, "loss": 0.1679, "lr": 1.4555543884624751e-05, "epoch": 3.149873417721519, "percentage": 63.0, "elapsed_time": "4:54:42", "remaining_time": "2:53:06"}
|
| 779 |
+
{"current_steps": 779, "total_steps": 1235, "loss": 0.1673, "lr": 1.4501147217474402e-05, "epoch": 3.1539240506329116, "percentage": 63.08, "elapsed_time": "4:55:03", "remaining_time": "2:52:43"}
|
| 780 |
+
{"current_steps": 780, "total_steps": 1235, "loss": 0.1723, "lr": 1.444679451900437e-05, "epoch": 3.1579746835443037, "percentage": 63.16, "elapsed_time": "4:55:25", "remaining_time": "2:52:20"}
|
| 781 |
+
{"current_steps": 781, "total_steps": 1235, "loss": 0.173, "lr": 1.4392486223817397e-05, "epoch": 3.162025316455696, "percentage": 63.24, "elapsed_time": "4:55:49", "remaining_time": "2:51:57"}
|
| 782 |
+
{"current_steps": 782, "total_steps": 1235, "loss": 0.1805, "lr": 1.4338222766161143e-05, "epoch": 3.1660759493670887, "percentage": 63.32, "elapsed_time": "4:56:11", "remaining_time": "2:51:34"}
|
| 783 |
+
{"current_steps": 783, "total_steps": 1235, "loss": 0.1637, "lr": 1.4284004579924777e-05, "epoch": 3.170126582278481, "percentage": 63.4, "elapsed_time": "4:56:34", "remaining_time": "2:51:12"}
|
| 784 |
+
{"current_steps": 784, "total_steps": 1235, "loss": 0.1721, "lr": 1.4229832098635479e-05, "epoch": 3.1741772151898733, "percentage": 63.48, "elapsed_time": "4:56:56", "remaining_time": "2:50:49"}
|
| 785 |
+
{"current_steps": 785, "total_steps": 1235, "loss": 0.1679, "lr": 1.4175705755454963e-05, "epoch": 3.178227848101266, "percentage": 63.56, "elapsed_time": "4:57:17", "remaining_time": "2:50:25"}
|
| 786 |
+
{"current_steps": 786, "total_steps": 1235, "loss": 0.1725, "lr": 1.412162598317602e-05, "epoch": 3.1822784810126583, "percentage": 63.64, "elapsed_time": "4:57:40", "remaining_time": "2:50:02"}
|
| 787 |
+
{"current_steps": 787, "total_steps": 1235, "loss": 0.1722, "lr": 1.406759321421907e-05, "epoch": 3.186329113924051, "percentage": 63.72, "elapsed_time": "4:58:02", "remaining_time": "2:49:39"}
|
| 788 |
+
{"current_steps": 788, "total_steps": 1235, "loss": 0.1718, "lr": 1.401360788062871e-05, "epoch": 3.190379746835443, "percentage": 63.81, "elapsed_time": "4:58:26", "remaining_time": "2:49:17"}
|
| 789 |
+
{"current_steps": 789, "total_steps": 1235, "loss": 0.1649, "lr": 1.3959670414070204e-05, "epoch": 3.1944303797468354, "percentage": 63.89, "elapsed_time": "4:58:48", "remaining_time": "2:48:54"}
|
| 790 |
+
{"current_steps": 790, "total_steps": 1235, "loss": 0.1701, "lr": 1.3905781245826108e-05, "epoch": 3.198481012658228, "percentage": 63.97, "elapsed_time": "4:59:11", "remaining_time": "2:48:31"}
|
| 791 |
+
{"current_steps": 791, "total_steps": 1235, "loss": 0.1624, "lr": 1.3851940806792778e-05, "epoch": 3.2025316455696204, "percentage": 64.05, "elapsed_time": "4:59:32", "remaining_time": "2:48:08"}
|
| 792 |
+
{"current_steps": 792, "total_steps": 1235, "loss": 0.1696, "lr": 1.379814952747693e-05, "epoch": 3.2065822784810125, "percentage": 64.13, "elapsed_time": "4:59:55", "remaining_time": "2:47:45"}
|
| 793 |
+
{"current_steps": 793, "total_steps": 1235, "loss": 0.1762, "lr": 1.3744407837992193e-05, "epoch": 3.210632911392405, "percentage": 64.21, "elapsed_time": "5:00:16", "remaining_time": "2:47:22"}
|
| 794 |
+
{"current_steps": 794, "total_steps": 1235, "loss": 0.1723, "lr": 1.3690716168055692e-05, "epoch": 3.2146835443037975, "percentage": 64.29, "elapsed_time": "5:00:38", "remaining_time": "2:46:58"}
|
| 795 |
+
{"current_steps": 795, "total_steps": 1235, "loss": 0.1747, "lr": 1.363707494698459e-05, "epoch": 3.21873417721519, "percentage": 64.37, "elapsed_time": "5:01:01", "remaining_time": "2:46:36"}
|
| 796 |
+
{"current_steps": 796, "total_steps": 1235, "loss": 0.1648, "lr": 1.358348460369265e-05, "epoch": 3.222784810126582, "percentage": 64.45, "elapsed_time": "5:01:24", "remaining_time": "2:46:13"}
|
| 797 |
+
{"current_steps": 797, "total_steps": 1235, "loss": 0.176, "lr": 1.352994556668684e-05, "epoch": 3.2268354430379746, "percentage": 64.53, "elapsed_time": "5:01:47", "remaining_time": "2:45:51"}
|
| 798 |
+
{"current_steps": 798, "total_steps": 1235, "loss": 0.1646, "lr": 1.3476458264063865e-05, "epoch": 3.230886075949367, "percentage": 64.62, "elapsed_time": "5:02:10", "remaining_time": "2:45:28"}
|
| 799 |
+
{"current_steps": 799, "total_steps": 1235, "loss": 0.17, "lr": 1.342302312350678e-05, "epoch": 3.2349367088607597, "percentage": 64.7, "elapsed_time": "5:02:32", "remaining_time": "2:45:05"}
|
| 800 |
+
{"current_steps": 800, "total_steps": 1235, "loss": 0.1693, "lr": 1.3369640572281537e-05, "epoch": 3.2389873417721518, "percentage": 64.78, "elapsed_time": "5:02:56", "remaining_time": "2:44:43"}
|
| 801 |
+
{"current_steps": 801, "total_steps": 1235, "loss": 0.1719, "lr": 1.3316311037233596e-05, "epoch": 3.2430379746835443, "percentage": 64.86, "elapsed_time": "5:03:17", "remaining_time": "2:44:19"}
|
| 802 |
+
{"current_steps": 802, "total_steps": 1235, "loss": 0.1734, "lr": 1.326303494478451e-05, "epoch": 3.247088607594937, "percentage": 64.94, "elapsed_time": "5:03:40", "remaining_time": "2:43:57"}
|
| 803 |
+
{"current_steps": 803, "total_steps": 1235, "loss": 0.1756, "lr": 1.3209812720928472e-05, "epoch": 3.2511392405063293, "percentage": 65.02, "elapsed_time": "5:04:03", "remaining_time": "2:43:34"}
|
| 804 |
+
{"current_steps": 804, "total_steps": 1235, "loss": 0.1738, "lr": 1.315664479122898e-05, "epoch": 3.2551898734177214, "percentage": 65.1, "elapsed_time": "5:04:26", "remaining_time": "2:43:11"}
|
| 805 |
+
{"current_steps": 805, "total_steps": 1235, "loss": 0.1752, "lr": 1.3103531580815378e-05, "epoch": 3.259240506329114, "percentage": 65.18, "elapsed_time": "5:04:49", "remaining_time": "2:42:49"}
|
| 806 |
+
{"current_steps": 806, "total_steps": 1235, "loss": 0.1706, "lr": 1.3050473514379488e-05, "epoch": 3.2632911392405064, "percentage": 65.26, "elapsed_time": "5:05:11", "remaining_time": "2:42:26"}
|
| 807 |
+
{"current_steps": 807, "total_steps": 1235, "loss": 0.1715, "lr": 1.2997471016172188e-05, "epoch": 3.267341772151899, "percentage": 65.34, "elapsed_time": "5:05:34", "remaining_time": "2:42:03"}
|
| 808 |
+
{"current_steps": 808, "total_steps": 1235, "loss": 0.1678, "lr": 1.2944524510000042e-05, "epoch": 3.271392405063291, "percentage": 65.43, "elapsed_time": "5:05:57", "remaining_time": "2:41:41"}
|
| 809 |
+
{"current_steps": 809, "total_steps": 1235, "loss": 0.1798, "lr": 1.2891634419221908e-05, "epoch": 3.2754430379746835, "percentage": 65.51, "elapsed_time": "5:06:19", "remaining_time": "2:41:18"}
|
| 810 |
+
{"current_steps": 810, "total_steps": 1235, "loss": 0.1717, "lr": 1.2838801166745545e-05, "epoch": 3.279493670886076, "percentage": 65.59, "elapsed_time": "5:06:43", "remaining_time": "2:40:56"}
|
| 811 |
+
{"current_steps": 811, "total_steps": 1235, "loss": 0.172, "lr": 1.2786025175024216e-05, "epoch": 3.2835443037974685, "percentage": 65.67, "elapsed_time": "5:07:05", "remaining_time": "2:40:32"}
|
| 812 |
+
{"current_steps": 812, "total_steps": 1235, "loss": 0.1786, "lr": 1.2733306866053357e-05, "epoch": 3.2875949367088606, "percentage": 65.75, "elapsed_time": "5:07:28", "remaining_time": "2:40:10"}
|
| 813 |
+
{"current_steps": 813, "total_steps": 1235, "loss": 0.1779, "lr": 1.2680646661367163e-05, "epoch": 3.291645569620253, "percentage": 65.83, "elapsed_time": "5:07:53", "remaining_time": "2:39:48"}
|
| 814 |
+
{"current_steps": 814, "total_steps": 1235, "loss": 0.1715, "lr": 1.2628044982035219e-05, "epoch": 3.2956962025316456, "percentage": 65.91, "elapsed_time": "5:08:14", "remaining_time": "2:39:25"}
|
| 815 |
+
{"current_steps": 815, "total_steps": 1235, "loss": 0.1737, "lr": 1.2575502248659155e-05, "epoch": 3.299746835443038, "percentage": 65.99, "elapsed_time": "5:08:35", "remaining_time": "2:39:01"}
|
| 816 |
+
{"current_steps": 816, "total_steps": 1235, "loss": 0.1747, "lr": 1.2523018881369269e-05, "epoch": 3.3037974683544302, "percentage": 66.07, "elapsed_time": "5:08:59", "remaining_time": "2:38:39"}
|
| 817 |
+
{"current_steps": 817, "total_steps": 1235, "loss": 0.1729, "lr": 1.2470595299821176e-05, "epoch": 3.3078481012658227, "percentage": 66.15, "elapsed_time": "5:09:20", "remaining_time": "2:38:16"}
|
| 818 |
+
{"current_steps": 818, "total_steps": 1235, "loss": 0.1725, "lr": 1.2418231923192416e-05, "epoch": 3.3118987341772153, "percentage": 66.23, "elapsed_time": "5:09:43", "remaining_time": "2:37:53"}
|
| 819 |
+
{"current_steps": 819, "total_steps": 1235, "loss": 0.1658, "lr": 1.2365929170179165e-05, "epoch": 3.3159493670886078, "percentage": 66.32, "elapsed_time": "5:10:06", "remaining_time": "2:37:31"}
|
| 820 |
+
{"current_steps": 820, "total_steps": 1235, "loss": 0.1682, "lr": 1.2313687458992848e-05, "epoch": 3.32, "percentage": 66.4, "elapsed_time": "5:10:29", "remaining_time": "2:37:08"}
|
| 821 |
+
{"current_steps": 821, "total_steps": 1235, "loss": 0.1667, "lr": 1.2261507207356785e-05, "epoch": 3.3240506329113924, "percentage": 66.48, "elapsed_time": "5:10:50", "remaining_time": "2:36:44"}
|
| 822 |
+
{"current_steps": 822, "total_steps": 1235, "loss": 0.1779, "lr": 1.220938883250288e-05, "epoch": 3.328101265822785, "percentage": 66.56, "elapsed_time": "5:11:13", "remaining_time": "2:36:22"}
|
| 823 |
+
{"current_steps": 823, "total_steps": 1235, "loss": 0.1644, "lr": 1.215733275116827e-05, "epoch": 3.3321518987341774, "percentage": 66.64, "elapsed_time": "5:11:35", "remaining_time": "2:35:59"}
|
| 824 |
+
{"current_steps": 824, "total_steps": 1235, "loss": 0.1754, "lr": 1.2105339379592005e-05, "epoch": 3.3362025316455695, "percentage": 66.72, "elapsed_time": "5:11:57", "remaining_time": "2:35:36"}
|
| 825 |
+
{"current_steps": 825, "total_steps": 1235, "loss": 0.1691, "lr": 1.2053409133511681e-05, "epoch": 3.340253164556962, "percentage": 66.8, "elapsed_time": "5:12:20", "remaining_time": "2:35:13"}
|
| 826 |
+
{"current_steps": 826, "total_steps": 1235, "loss": 0.1668, "lr": 1.2001542428160173e-05, "epoch": 3.3443037974683545, "percentage": 66.88, "elapsed_time": "5:12:43", "remaining_time": "2:34:51"}
|
| 827 |
+
{"current_steps": 827, "total_steps": 1235, "loss": 0.159, "lr": 1.1949739678262278e-05, "epoch": 3.348354430379747, "percentage": 66.96, "elapsed_time": "5:13:04", "remaining_time": "2:34:27"}
|
| 828 |
+
{"current_steps": 828, "total_steps": 1235, "loss": 0.1652, "lr": 1.189800129803139e-05, "epoch": 3.352405063291139, "percentage": 67.04, "elapsed_time": "5:13:27", "remaining_time": "2:34:04"}
|
| 829 |
+
{"current_steps": 829, "total_steps": 1235, "loss": 0.1662, "lr": 1.1846327701166228e-05, "epoch": 3.3564556962025316, "percentage": 67.13, "elapsed_time": "5:13:48", "remaining_time": "2:33:41"}
|
| 830 |
+
{"current_steps": 830, "total_steps": 1235, "loss": 0.1706, "lr": 1.1794719300847493e-05, "epoch": 3.360506329113924, "percentage": 67.21, "elapsed_time": "5:14:11", "remaining_time": "2:33:18"}
|
| 831 |
+
{"current_steps": 831, "total_steps": 1235, "loss": 0.1635, "lr": 1.1743176509734582e-05, "epoch": 3.3645569620253166, "percentage": 67.29, "elapsed_time": "5:14:34", "remaining_time": "2:32:56"}
|
| 832 |
+
{"current_steps": 832, "total_steps": 1235, "loss": 0.1711, "lr": 1.1691699739962275e-05, "epoch": 3.3686075949367087, "percentage": 67.37, "elapsed_time": "5:14:56", "remaining_time": "2:32:32"}
|
| 833 |
+
{"current_steps": 833, "total_steps": 1235, "loss": 0.1617, "lr": 1.1640289403137456e-05, "epoch": 3.372658227848101, "percentage": 67.45, "elapsed_time": "5:15:19", "remaining_time": "2:32:10"}
|
| 834 |
+
{"current_steps": 834, "total_steps": 1235, "loss": 0.1661, "lr": 1.1588945910335802e-05, "epoch": 3.3767088607594937, "percentage": 67.53, "elapsed_time": "5:15:42", "remaining_time": "2:31:47"}
|
| 835 |
+
{"current_steps": 835, "total_steps": 1235, "loss": 0.168, "lr": 1.1537669672098517e-05, "epoch": 3.3807594936708862, "percentage": 67.61, "elapsed_time": "5:16:05", "remaining_time": "2:31:25"}
|
| 836 |
+
{"current_steps": 836, "total_steps": 1235, "loss": 0.1749, "lr": 1.1486461098429036e-05, "epoch": 3.3848101265822783, "percentage": 67.69, "elapsed_time": "5:16:27", "remaining_time": "2:31:02"}
|
| 837 |
+
{"current_steps": 837, "total_steps": 1235, "loss": 0.181, "lr": 1.1435320598789747e-05, "epoch": 3.388860759493671, "percentage": 67.77, "elapsed_time": "5:16:48", "remaining_time": "2:30:38"}
|
| 838 |
+
{"current_steps": 838, "total_steps": 1235, "loss": 0.1696, "lr": 1.1384248582098736e-05, "epoch": 3.3929113924050633, "percentage": 67.85, "elapsed_time": "5:17:10", "remaining_time": "2:30:15"}
|
| 839 |
+
{"current_steps": 839, "total_steps": 1235, "loss": 0.1722, "lr": 1.1333245456726467e-05, "epoch": 3.396962025316456, "percentage": 67.94, "elapsed_time": "5:17:32", "remaining_time": "2:29:52"}
|
| 840 |
+
{"current_steps": 840, "total_steps": 1235, "loss": 0.1731, "lr": 1.128231163049258e-05, "epoch": 3.401012658227848, "percentage": 68.02, "elapsed_time": "5:17:53", "remaining_time": "2:29:29"}
|
| 841 |
+
{"current_steps": 841, "total_steps": 1235, "loss": 0.1746, "lr": 1.123144751066259e-05, "epoch": 3.4050632911392404, "percentage": 68.1, "elapsed_time": "5:18:15", "remaining_time": "2:29:05"}
|
| 842 |
+
{"current_steps": 842, "total_steps": 1235, "loss": 0.1723, "lr": 1.1180653503944657e-05, "epoch": 3.409113924050633, "percentage": 68.18, "elapsed_time": "5:18:37", "remaining_time": "2:28:42"}
|
| 843 |
+
{"current_steps": 843, "total_steps": 1235, "loss": 0.1712, "lr": 1.1129930016486287e-05, "epoch": 3.4131645569620255, "percentage": 68.26, "elapsed_time": "5:18:59", "remaining_time": "2:28:19"}
|
| 844 |
+
{"current_steps": 844, "total_steps": 1235, "loss": 0.1707, "lr": 1.107927745387114e-05, "epoch": 3.4172151898734175, "percentage": 68.34, "elapsed_time": "5:19:21", "remaining_time": "2:27:57"}
|
| 845 |
+
{"current_steps": 845, "total_steps": 1235, "loss": 0.1731, "lr": 1.1028696221115766e-05, "epoch": 3.42126582278481, "percentage": 68.42, "elapsed_time": "5:19:43", "remaining_time": "2:27:34"}
|
| 846 |
+
{"current_steps": 846, "total_steps": 1235, "loss": 0.1696, "lr": 1.0978186722666341e-05, "epoch": 3.4253164556962026, "percentage": 68.5, "elapsed_time": "5:20:05", "remaining_time": "2:27:10"}
|
| 847 |
+
{"current_steps": 847, "total_steps": 1235, "loss": 0.1726, "lr": 1.0927749362395475e-05, "epoch": 3.429367088607595, "percentage": 68.58, "elapsed_time": "5:20:27", "remaining_time": "2:26:47"}
|
| 848 |
+
{"current_steps": 848, "total_steps": 1235, "loss": 0.1774, "lr": 1.0877384543598954e-05, "epoch": 3.433417721518987, "percentage": 68.66, "elapsed_time": "5:20:49", "remaining_time": "2:26:24"}
|
| 849 |
+
{"current_steps": 849, "total_steps": 1235, "loss": 0.178, "lr": 1.0827092668992529e-05, "epoch": 3.4374683544303797, "percentage": 68.74, "elapsed_time": "5:21:13", "remaining_time": "2:26:02"}
|
| 850 |
+
{"current_steps": 850, "total_steps": 1235, "loss": 0.1687, "lr": 1.077687414070869e-05, "epoch": 3.441518987341772, "percentage": 68.83, "elapsed_time": "5:21:36", "remaining_time": "2:25:40"}
|
| 851 |
+
{"current_steps": 851, "total_steps": 1235, "loss": 0.1698, "lr": 1.0726729360293451e-05, "epoch": 3.4455696202531647, "percentage": 68.91, "elapsed_time": "5:22:00", "remaining_time": "2:25:18"}
|
| 852 |
+
{"current_steps": 852, "total_steps": 1235, "loss": 0.1628, "lr": 1.0676658728703147e-05, "epoch": 3.449620253164557, "percentage": 68.99, "elapsed_time": "5:22:23", "remaining_time": "2:24:55"}
|
| 853 |
+
{"current_steps": 853, "total_steps": 1235, "loss": 0.1716, "lr": 1.0626662646301198e-05, "epoch": 3.4536708860759493, "percentage": 69.07, "elapsed_time": "5:22:48", "remaining_time": "2:24:33"}
|
| 854 |
+
{"current_steps": 854, "total_steps": 1235, "loss": 0.1697, "lr": 1.0576741512854958e-05, "epoch": 3.457721518987342, "percentage": 69.15, "elapsed_time": "5:23:12", "remaining_time": "2:24:11"}
|
| 855 |
+
{"current_steps": 855, "total_steps": 1235, "loss": 0.1725, "lr": 1.052689572753247e-05, "epoch": 3.4617721518987343, "percentage": 69.23, "elapsed_time": "5:23:33", "remaining_time": "2:23:48"}
|
| 856 |
+
{"current_steps": 856, "total_steps": 1235, "loss": 0.1692, "lr": 1.0477125688899328e-05, "epoch": 3.4658227848101264, "percentage": 69.31, "elapsed_time": "5:23:56", "remaining_time": "2:23:25"}
|
| 857 |
+
{"current_steps": 857, "total_steps": 1235, "loss": 0.1619, "lr": 1.0427431794915406e-05, "epoch": 3.469873417721519, "percentage": 69.39, "elapsed_time": "5:24:19", "remaining_time": "2:23:02"}
|
| 858 |
+
{"current_steps": 858, "total_steps": 1235, "loss": 0.1707, "lr": 1.0377814442931769e-05, "epoch": 3.4739240506329114, "percentage": 69.47, "elapsed_time": "5:24:40", "remaining_time": "2:22:39"}
|
| 859 |
+
{"current_steps": 859, "total_steps": 1235, "loss": 0.1753, "lr": 1.0328274029687439e-05, "epoch": 3.477974683544304, "percentage": 69.55, "elapsed_time": "5:25:02", "remaining_time": "2:22:16"}
|
| 860 |
+
{"current_steps": 860, "total_steps": 1235, "loss": 0.1658, "lr": 1.0278810951306253e-05, "epoch": 3.482025316455696, "percentage": 69.64, "elapsed_time": "5:25:25", "remaining_time": "2:21:53"}
|
| 861 |
+
{"current_steps": 861, "total_steps": 1235, "loss": 0.1673, "lr": 1.0229425603293647e-05, "epoch": 3.4860759493670885, "percentage": 69.72, "elapsed_time": "5:25:47", "remaining_time": "2:21:31"}
|
| 862 |
+
{"current_steps": 862, "total_steps": 1235, "loss": 0.1765, "lr": 1.0180118380533558e-05, "epoch": 3.490126582278481, "percentage": 69.8, "elapsed_time": "5:26:10", "remaining_time": "2:21:08"}
|
| 863 |
+
{"current_steps": 863, "total_steps": 1235, "loss": 0.1702, "lr": 1.0130889677285225e-05, "epoch": 3.4941772151898736, "percentage": 69.88, "elapsed_time": "5:26:31", "remaining_time": "2:20:44"}
|
| 864 |
+
{"current_steps": 864, "total_steps": 1235, "loss": 0.1736, "lr": 1.008173988718005e-05, "epoch": 3.4982278481012656, "percentage": 69.96, "elapsed_time": "5:26:53", "remaining_time": "2:20:22"}
|
| 865 |
+
{"current_steps": 865, "total_steps": 1235, "loss": 0.1706, "lr": 1.0032669403218439e-05, "epoch": 3.502278481012658, "percentage": 70.04, "elapsed_time": "5:27:16", "remaining_time": "2:19:59"}
|
| 866 |
+
{"current_steps": 866, "total_steps": 1235, "loss": 0.1741, "lr": 9.983678617766677e-06, "epoch": 3.5063291139240507, "percentage": 70.12, "elapsed_time": "5:27:38", "remaining_time": "2:19:36"}
|
| 867 |
+
{"current_steps": 867, "total_steps": 1235, "loss": 0.1683, "lr": 9.934767922553788e-06, "epoch": 3.510379746835443, "percentage": 70.2, "elapsed_time": "5:27:59", "remaining_time": "2:19:13"}
|
| 868 |
+
{"current_steps": 868, "total_steps": 1235, "loss": 0.1724, "lr": 9.885937708668371e-06, "epoch": 3.5144303797468357, "percentage": 70.28, "elapsed_time": "5:28:21", "remaining_time": "2:18:49"}
|
| 869 |
+
{"current_steps": 869, "total_steps": 1235, "loss": 0.1703, "lr": 9.837188366555524e-06, "epoch": 3.5184810126582278, "percentage": 70.36, "elapsed_time": "5:28:43", "remaining_time": "2:18:27"}
|
| 870 |
+
{"current_steps": 870, "total_steps": 1235, "loss": 0.1707, "lr": 9.788520286013691e-06, "epoch": 3.5225316455696203, "percentage": 70.45, "elapsed_time": "5:29:05", "remaining_time": "2:18:03"}
|
| 871 |
+
{"current_steps": 871, "total_steps": 1235, "loss": 0.1753, "lr": 9.739933856191537e-06, "epoch": 3.526582278481013, "percentage": 70.53, "elapsed_time": "5:29:28", "remaining_time": "2:17:41"}
|
| 872 |
+
{"current_steps": 872, "total_steps": 1235, "loss": 0.1716, "lr": 9.691429465584866e-06, "epoch": 3.530632911392405, "percentage": 70.61, "elapsed_time": "5:29:50", "remaining_time": "2:17:18"}
|
| 873 |
+
{"current_steps": 873, "total_steps": 1235, "loss": 0.1644, "lr": 9.643007502033492e-06, "epoch": 3.5346835443037974, "percentage": 70.69, "elapsed_time": "5:30:12", "remaining_time": "2:16:55"}
|
| 874 |
+
{"current_steps": 874, "total_steps": 1235, "loss": 0.1774, "lr": 9.594668352718152e-06, "epoch": 3.53873417721519, "percentage": 70.77, "elapsed_time": "5:30:34", "remaining_time": "2:16:32"}
|
| 875 |
+
{"current_steps": 875, "total_steps": 1235, "loss": 0.1707, "lr": 9.546412404157383e-06, "epoch": 3.5427848101265824, "percentage": 70.85, "elapsed_time": "5:30:56", "remaining_time": "2:16:09"}
|
| 876 |
+
{"current_steps": 876, "total_steps": 1235, "loss": 0.1826, "lr": 9.498240042204471e-06, "epoch": 3.546835443037975, "percentage": 70.93, "elapsed_time": "5:31:18", "remaining_time": "2:15:46"}
|
| 877 |
+
{"current_steps": 877, "total_steps": 1235, "loss": 0.1682, "lr": 9.450151652044339e-06, "epoch": 3.550886075949367, "percentage": 71.01, "elapsed_time": "5:31:42", "remaining_time": "2:15:24"}
|
| 878 |
+
{"current_steps": 878, "total_steps": 1235, "loss": 0.1752, "lr": 9.402147618190472e-06, "epoch": 3.5549367088607595, "percentage": 71.09, "elapsed_time": "5:32:02", "remaining_time": "2:15:00"}
|
| 879 |
+
{"current_steps": 879, "total_steps": 1235, "loss": 0.1678, "lr": 9.354228324481841e-06, "epoch": 3.558987341772152, "percentage": 71.17, "elapsed_time": "5:32:24", "remaining_time": "2:14:37"}
|
| 880 |
+
{"current_steps": 880, "total_steps": 1235, "loss": 0.1763, "lr": 9.306394154079852e-06, "epoch": 3.563037974683544, "percentage": 71.26, "elapsed_time": "5:32:46", "remaining_time": "2:14:14"}
|
| 881 |
+
{"current_steps": 881, "total_steps": 1235, "loss": 0.17, "lr": 9.258645489465254e-06, "epoch": 3.5670886075949366, "percentage": 71.34, "elapsed_time": "5:33:08", "remaining_time": "2:13:51"}
|
| 882 |
+
{"current_steps": 882, "total_steps": 1235, "loss": 0.178, "lr": 9.21098271243509e-06, "epoch": 3.571139240506329, "percentage": 71.42, "elapsed_time": "5:33:29", "remaining_time": "2:13:28"}
|
| 883 |
+
{"current_steps": 883, "total_steps": 1235, "loss": 0.1708, "lr": 9.163406204099659e-06, "epoch": 3.5751898734177217, "percentage": 71.5, "elapsed_time": "5:33:51", "remaining_time": "2:13:05"}
|
| 884 |
+
{"current_steps": 884, "total_steps": 1235, "loss": 0.158, "lr": 9.115916344879452e-06, "epoch": 3.579240506329114, "percentage": 71.58, "elapsed_time": "5:34:14", "remaining_time": "2:12:42"}
|
| 885 |
+
{"current_steps": 885, "total_steps": 1235, "loss": 0.1807, "lr": 9.068513514502126e-06, "epoch": 3.5832911392405062, "percentage": 71.66, "elapsed_time": "5:34:34", "remaining_time": "2:12:19"}
|
| 886 |
+
{"current_steps": 886, "total_steps": 1235, "loss": 0.1725, "lr": 9.021198091999439e-06, "epoch": 3.5873417721518988, "percentage": 71.74, "elapsed_time": "5:34:57", "remaining_time": "2:11:56"}
|
| 887 |
+
{"current_steps": 887, "total_steps": 1235, "loss": 0.1787, "lr": 8.973970455704251e-06, "epoch": 3.5913924050632913, "percentage": 71.82, "elapsed_time": "5:35:19", "remaining_time": "2:11:33"}
|
| 888 |
+
{"current_steps": 888, "total_steps": 1235, "loss": 0.1633, "lr": 8.926830983247495e-06, "epoch": 3.5954430379746833, "percentage": 71.9, "elapsed_time": "5:35:41", "remaining_time": "2:11:10"}
|
| 889 |
+
{"current_steps": 889, "total_steps": 1235, "loss": 0.1656, "lr": 8.879780051555116e-06, "epoch": 3.599493670886076, "percentage": 71.98, "elapsed_time": "5:36:03", "remaining_time": "2:10:47"}
|
| 890 |
+
{"current_steps": 890, "total_steps": 1235, "loss": 0.1776, "lr": 8.83281803684512e-06, "epoch": 3.6035443037974684, "percentage": 72.06, "elapsed_time": "5:36:25", "remaining_time": "2:10:24"}
|
| 891 |
+
{"current_steps": 891, "total_steps": 1235, "loss": 0.1697, "lr": 8.785945314624532e-06, "epoch": 3.607594936708861, "percentage": 72.15, "elapsed_time": "5:36:46", "remaining_time": "2:10:01"}
|
| 892 |
+
{"current_steps": 892, "total_steps": 1235, "loss": 0.1756, "lr": 8.739162259686385e-06, "epoch": 3.6116455696202534, "percentage": 72.23, "elapsed_time": "5:37:08", "remaining_time": "2:09:38"}
|
| 893 |
+
{"current_steps": 893, "total_steps": 1235, "loss": 0.1774, "lr": 8.692469246106734e-06, "epoch": 3.6156962025316455, "percentage": 72.31, "elapsed_time": "5:37:31", "remaining_time": "2:09:15"}
|
| 894 |
+
{"current_steps": 894, "total_steps": 1235, "loss": 0.1716, "lr": 8.645866647241677e-06, "epoch": 3.619746835443038, "percentage": 72.39, "elapsed_time": "5:37:54", "remaining_time": "2:08:53"}
|
| 895 |
+
{"current_steps": 895, "total_steps": 1235, "loss": 0.1719, "lr": 8.599354835724348e-06, "epoch": 3.6237974683544305, "percentage": 72.47, "elapsed_time": "5:38:16", "remaining_time": "2:08:30"}
|
| 896 |
+
{"current_steps": 896, "total_steps": 1235, "loss": 0.1647, "lr": 8.552934183461958e-06, "epoch": 3.6278481012658226, "percentage": 72.55, "elapsed_time": "5:38:38", "remaining_time": "2:08:07"}
|
| 897 |
+
{"current_steps": 897, "total_steps": 1235, "loss": 0.1717, "lr": 8.506605061632805e-06, "epoch": 3.631898734177215, "percentage": 72.63, "elapsed_time": "5:39:00", "remaining_time": "2:07:44"}
|
| 898 |
+
{"current_steps": 898, "total_steps": 1235, "loss": 0.1638, "lr": 8.460367840683308e-06, "epoch": 3.6359493670886076, "percentage": 72.71, "elapsed_time": "5:39:23", "remaining_time": "2:07:21"}
|
| 899 |
+
{"current_steps": 899, "total_steps": 1235, "loss": 0.1712, "lr": 8.414222890325065e-06, "epoch": 3.64, "percentage": 72.79, "elapsed_time": "5:39:46", "remaining_time": "2:06:59"}
|
| 900 |
+
{"current_steps": 900, "total_steps": 1235, "loss": 0.1731, "lr": 8.368170579531855e-06, "epoch": 3.6440506329113926, "percentage": 72.87, "elapsed_time": "5:40:09", "remaining_time": "2:06:36"}
|
| 901 |
+
{"current_steps": 901, "total_steps": 1235, "loss": 0.1734, "lr": 8.322211276536733e-06, "epoch": 3.6481012658227847, "percentage": 72.96, "elapsed_time": "5:40:32", "remaining_time": "2:06:14"}
|
| 902 |
+
{"current_steps": 902, "total_steps": 1235, "loss": 0.1686, "lr": 8.27634534882907e-06, "epoch": 3.6521518987341772, "percentage": 73.04, "elapsed_time": "5:40:54", "remaining_time": "2:05:51"}
|
| 903 |
+
{"current_steps": 903, "total_steps": 1235, "loss": 0.1746, "lr": 8.230573163151585e-06, "epoch": 3.6562025316455697, "percentage": 73.12, "elapsed_time": "5:41:17", "remaining_time": "2:05:28"}
|
| 904 |
+
{"current_steps": 904, "total_steps": 1235, "loss": 0.1635, "lr": 8.184895085497466e-06, "epoch": 3.660253164556962, "percentage": 73.2, "elapsed_time": "5:41:40", "remaining_time": "2:05:06"}
|
| 905 |
+
{"current_steps": 905, "total_steps": 1235, "loss": 0.1602, "lr": 8.139311481107401e-06, "epoch": 3.6643037974683543, "percentage": 73.28, "elapsed_time": "5:42:02", "remaining_time": "2:04:43"}
|
| 906 |
+
{"current_steps": 906, "total_steps": 1235, "loss": 0.1768, "lr": 8.093822714466686e-06, "epoch": 3.668354430379747, "percentage": 73.36, "elapsed_time": "5:42:26", "remaining_time": "2:04:21"}
|
| 907 |
+
{"current_steps": 907, "total_steps": 1235, "loss": 0.1683, "lr": 8.048429149302271e-06, "epoch": 3.6724050632911394, "percentage": 73.44, "elapsed_time": "5:42:49", "remaining_time": "2:03:58"}
|
| 908 |
+
{"current_steps": 908, "total_steps": 1235, "loss": 0.1873, "lr": 8.003131148579902e-06, "epoch": 3.676455696202532, "percentage": 73.52, "elapsed_time": "5:43:13", "remaining_time": "2:03:36"}
|
| 909 |
+
{"current_steps": 909, "total_steps": 1235, "loss": 0.167, "lr": 7.957929074501182e-06, "epoch": 3.680506329113924, "percentage": 73.6, "elapsed_time": "5:43:36", "remaining_time": "2:03:13"}
|
| 910 |
+
{"current_steps": 910, "total_steps": 1235, "loss": 0.1675, "lr": 7.912823288500695e-06, "epoch": 3.6845569620253165, "percentage": 73.68, "elapsed_time": "5:43:59", "remaining_time": "2:02:51"}
|
| 911 |
+
{"current_steps": 911, "total_steps": 1235, "loss": 0.1705, "lr": 7.867814151243102e-06, "epoch": 3.688607594936709, "percentage": 73.77, "elapsed_time": "5:44:23", "remaining_time": "2:02:28"}
|
| 912 |
+
{"current_steps": 912, "total_steps": 1235, "loss": 0.1703, "lr": 7.822902022620267e-06, "epoch": 3.692658227848101, "percentage": 73.85, "elapsed_time": "5:44:44", "remaining_time": "2:02:05"}
|
| 913 |
+
{"current_steps": 913, "total_steps": 1235, "loss": 0.1774, "lr": 7.778087261748377e-06, "epoch": 3.6967088607594936, "percentage": 73.93, "elapsed_time": "5:45:06", "remaining_time": "2:01:42"}
|
| 914 |
+
{"current_steps": 914, "total_steps": 1235, "loss": 0.1746, "lr": 7.733370226965056e-06, "epoch": 3.700759493670886, "percentage": 74.01, "elapsed_time": "5:45:29", "remaining_time": "2:01:20"}
|
| 915 |
+
{"current_steps": 915, "total_steps": 1235, "loss": 0.1716, "lr": 7.688751275826527e-06, "epoch": 3.7048101265822786, "percentage": 74.09, "elapsed_time": "5:45:52", "remaining_time": "2:00:57"}
|
| 916 |
+
{"current_steps": 916, "total_steps": 1235, "loss": 0.1615, "lr": 7.644230765104735e-06, "epoch": 3.708860759493671, "percentage": 74.17, "elapsed_time": "5:46:15", "remaining_time": "2:00:35"}
|
| 917 |
+
{"current_steps": 917, "total_steps": 1235, "loss": 0.1635, "lr": 7.599809050784502e-06, "epoch": 3.712911392405063, "percentage": 74.25, "elapsed_time": "5:46:36", "remaining_time": "2:00:11"}
|
| 918 |
+
{"current_steps": 918, "total_steps": 1235, "loss": 0.1695, "lr": 7.555486488060661e-06, "epoch": 3.7169620253164557, "percentage": 74.33, "elapsed_time": "5:46:58", "remaining_time": "1:59:48"}
|
| 919 |
+
{"current_steps": 919, "total_steps": 1235, "loss": 0.1715, "lr": 7.511263431335249e-06, "epoch": 3.721012658227848, "percentage": 74.41, "elapsed_time": "5:47:20", "remaining_time": "1:59:26"}
|
| 920 |
+
{"current_steps": 920, "total_steps": 1235, "loss": 0.1695, "lr": 7.467140234214656e-06, "epoch": 3.7250632911392403, "percentage": 74.49, "elapsed_time": "5:47:43", "remaining_time": "1:59:03"}
|
| 921 |
+
{"current_steps": 921, "total_steps": 1235, "loss": 0.1735, "lr": 7.423117249506777e-06, "epoch": 3.729113924050633, "percentage": 74.57, "elapsed_time": "5:48:06", "remaining_time": "1:58:40"}
|
| 922 |
+
{"current_steps": 922, "total_steps": 1235, "loss": 0.1636, "lr": 7.379194829218231e-06, "epoch": 3.7331645569620253, "percentage": 74.66, "elapsed_time": "5:48:27", "remaining_time": "1:58:17"}
|
| 923 |
+
{"current_steps": 923, "total_steps": 1235, "loss": 0.1756, "lr": 7.335373324551518e-06, "epoch": 3.737215189873418, "percentage": 74.74, "elapsed_time": "5:48:50", "remaining_time": "1:57:54"}
|
| 924 |
+
{"current_steps": 924, "total_steps": 1235, "loss": 0.1733, "lr": 7.291653085902224e-06, "epoch": 3.7412658227848103, "percentage": 74.82, "elapsed_time": "5:49:11", "remaining_time": "1:57:31"}
|
| 925 |
+
{"current_steps": 925, "total_steps": 1235, "loss": 0.1679, "lr": 7.248034462856213e-06, "epoch": 3.7453164556962024, "percentage": 74.9, "elapsed_time": "5:49:32", "remaining_time": "1:57:08"}
|
| 926 |
+
{"current_steps": 926, "total_steps": 1235, "loss": 0.1656, "lr": 7.20451780418683e-06, "epoch": 3.749367088607595, "percentage": 74.98, "elapsed_time": "5:49:54", "remaining_time": "1:56:45"}
|
| 927 |
+
{"current_steps": 927, "total_steps": 1235, "loss": 0.1653, "lr": 7.161103457852128e-06, "epoch": 3.7534177215189874, "percentage": 75.06, "elapsed_time": "5:50:16", "remaining_time": "1:56:22"}
|
| 928 |
+
{"current_steps": 928, "total_steps": 1235, "loss": 0.169, "lr": 7.117791770992046e-06, "epoch": 3.7574683544303795, "percentage": 75.14, "elapsed_time": "5:50:39", "remaining_time": "1:56:00"}
|
| 929 |
+
{"current_steps": 929, "total_steps": 1235, "loss": 0.182, "lr": 7.074583089925688e-06, "epoch": 3.761518987341772, "percentage": 75.22, "elapsed_time": "5:51:01", "remaining_time": "1:55:37"}
|
| 930 |
+
{"current_steps": 930, "total_steps": 1235, "loss": 0.1707, "lr": 7.0314777601485155e-06, "epoch": 3.7655696202531646, "percentage": 75.3, "elapsed_time": "5:51:23", "remaining_time": "1:55:14"}
|
| 931 |
+
{"current_steps": 931, "total_steps": 1235, "loss": 0.1729, "lr": 6.988476126329604e-06, "epoch": 3.769620253164557, "percentage": 75.38, "elapsed_time": "5:51:45", "remaining_time": "1:54:51"}
|
| 932 |
+
{"current_steps": 932, "total_steps": 1235, "loss": 0.1757, "lr": 6.945578532308857e-06, "epoch": 3.7736708860759496, "percentage": 75.47, "elapsed_time": "5:52:06", "remaining_time": "1:54:28"}
|
| 933 |
+
{"current_steps": 933, "total_steps": 1235, "loss": 0.1628, "lr": 6.902785321094301e-06, "epoch": 3.7777215189873417, "percentage": 75.55, "elapsed_time": "5:52:29", "remaining_time": "1:54:05"}
|
| 934 |
+
{"current_steps": 934, "total_steps": 1235, "loss": 0.1786, "lr": 6.8600968348593115e-06, "epoch": 3.781772151898734, "percentage": 75.63, "elapsed_time": "5:52:51", "remaining_time": "1:53:43"}
|
| 935 |
+
{"current_steps": 935, "total_steps": 1235, "loss": 0.1511, "lr": 6.817513414939892e-06, "epoch": 3.7858227848101267, "percentage": 75.71, "elapsed_time": "5:53:13", "remaining_time": "1:53:19"}
|
| 936 |
+
{"current_steps": 936, "total_steps": 1235, "loss": 0.1681, "lr": 6.775035401831924e-06, "epoch": 3.7898734177215188, "percentage": 75.79, "elapsed_time": "5:53:34", "remaining_time": "1:52:56"}
|
| 937 |
+
{"current_steps": 937, "total_steps": 1235, "loss": 0.166, "lr": 6.732663135188473e-06, "epoch": 3.7939240506329113, "percentage": 75.87, "elapsed_time": "5:53:55", "remaining_time": "1:52:33"}
|
| 938 |
+
{"current_steps": 938, "total_steps": 1235, "loss": 0.1711, "lr": 6.690396953817055e-06, "epoch": 3.797974683544304, "percentage": 75.95, "elapsed_time": "5:54:18", "remaining_time": "1:52:11"}
|
| 939 |
+
{"current_steps": 939, "total_steps": 1235, "loss": 0.171, "lr": 6.648237195676927e-06, "epoch": 3.8020253164556963, "percentage": 76.03, "elapsed_time": "5:54:40", "remaining_time": "1:51:48"}
|
| 940 |
+
{"current_steps": 940, "total_steps": 1235, "loss": 0.1632, "lr": 6.606184197876395e-06, "epoch": 3.806075949367089, "percentage": 76.11, "elapsed_time": "5:55:02", "remaining_time": "1:51:25"}
|
| 941 |
+
{"current_steps": 941, "total_steps": 1235, "loss": 0.1613, "lr": 6.564238296670109e-06, "epoch": 3.810126582278481, "percentage": 76.19, "elapsed_time": "5:55:25", "remaining_time": "1:51:02"}
|
| 942 |
+
{"current_steps": 942, "total_steps": 1235, "loss": 0.1636, "lr": 6.52239982745638e-06, "epoch": 3.8141772151898734, "percentage": 76.28, "elapsed_time": "5:55:47", "remaining_time": "1:50:39"}
|
| 943 |
+
{"current_steps": 943, "total_steps": 1235, "loss": 0.1749, "lr": 6.480669124774484e-06, "epoch": 3.818227848101266, "percentage": 76.36, "elapsed_time": "5:56:08", "remaining_time": "1:50:16"}
|
| 944 |
+
{"current_steps": 944, "total_steps": 1235, "loss": 0.1679, "lr": 6.439046522302013e-06, "epoch": 3.822278481012658, "percentage": 76.44, "elapsed_time": "5:56:32", "remaining_time": "1:49:54"}
|
| 945 |
+
{"current_steps": 945, "total_steps": 1235, "loss": 0.1694, "lr": 6.397532352852191e-06, "epoch": 3.8263291139240505, "percentage": 76.52, "elapsed_time": "5:56:56", "remaining_time": "1:49:32"}
|
| 946 |
+
{"current_steps": 946, "total_steps": 1235, "loss": 0.1662, "lr": 6.356126948371202e-06, "epoch": 3.830379746835443, "percentage": 76.6, "elapsed_time": "5:57:18", "remaining_time": "1:49:09"}
|
| 947 |
+
{"current_steps": 947, "total_steps": 1235, "loss": 0.163, "lr": 6.314830639935559e-06, "epoch": 3.8344303797468355, "percentage": 76.68, "elapsed_time": "5:57:41", "remaining_time": "1:48:46"}
|
| 948 |
+
{"current_steps": 948, "total_steps": 1235, "loss": 0.1596, "lr": 6.273643757749448e-06, "epoch": 3.838481012658228, "percentage": 76.76, "elapsed_time": "5:58:03", "remaining_time": "1:48:24"}
|
| 949 |
+
{"current_steps": 949, "total_steps": 1235, "loss": 0.1795, "lr": 6.2325666311420856e-06, "epoch": 3.84253164556962, "percentage": 76.84, "elapsed_time": "5:58:26", "remaining_time": "1:48:01"}
|
| 950 |
+
{"current_steps": 950, "total_steps": 1235, "loss": 0.1758, "lr": 6.1915995885650675e-06, "epoch": 3.8465822784810126, "percentage": 76.92, "elapsed_time": "5:58:50", "remaining_time": "1:47:39"}
|
| 951 |
+
{"current_steps": 951, "total_steps": 1235, "loss": 0.1708, "lr": 6.150742957589784e-06, "epoch": 3.850632911392405, "percentage": 77.0, "elapsed_time": "5:59:14", "remaining_time": "1:47:16"}
|
| 952 |
+
{"current_steps": 952, "total_steps": 1235, "loss": 0.1702, "lr": 6.109997064904774e-06, "epoch": 3.8546835443037972, "percentage": 77.09, "elapsed_time": "5:59:35", "remaining_time": "1:46:53"}
|
| 953 |
+
{"current_steps": 953, "total_steps": 1235, "loss": 0.1659, "lr": 6.069362236313092e-06, "epoch": 3.8587341772151897, "percentage": 77.17, "elapsed_time": "5:59:57", "remaining_time": "1:46:30"}
|
| 954 |
+
{"current_steps": 954, "total_steps": 1235, "loss": 0.1672, "lr": 6.0288387967297565e-06, "epoch": 3.8627848101265823, "percentage": 77.25, "elapsed_time": "6:00:19", "remaining_time": "1:46:08"}
|
| 955 |
+
{"current_steps": 955, "total_steps": 1235, "loss": 0.1705, "lr": 5.988427070179108e-06, "epoch": 3.8668354430379748, "percentage": 77.33, "elapsed_time": "6:00:41", "remaining_time": "1:45:45"}
|
| 956 |
+
{"current_steps": 956, "total_steps": 1235, "loss": 0.1723, "lr": 5.948127379792234e-06, "epoch": 3.8708860759493673, "percentage": 77.41, "elapsed_time": "6:01:04", "remaining_time": "1:45:22"}
|
| 957 |
+
{"current_steps": 957, "total_steps": 1235, "loss": 0.1686, "lr": 5.90794004780439e-06, "epoch": 3.8749367088607594, "percentage": 77.49, "elapsed_time": "6:01:25", "remaining_time": "1:44:59"}
|
| 958 |
+
{"current_steps": 958, "total_steps": 1235, "loss": 0.163, "lr": 5.867865395552405e-06, "epoch": 3.878987341772152, "percentage": 77.57, "elapsed_time": "6:01:48", "remaining_time": "1:44:36"}
|
| 959 |
+
{"current_steps": 959, "total_steps": 1235, "loss": 0.1682, "lr": 5.8279037434721364e-06, "epoch": 3.8830379746835444, "percentage": 77.65, "elapsed_time": "6:02:10", "remaining_time": "1:44:14"}
|
| 960 |
+
{"current_steps": 960, "total_steps": 1235, "loss": 0.16, "lr": 5.788055411095892e-06, "epoch": 3.8870886075949365, "percentage": 77.73, "elapsed_time": "6:02:33", "remaining_time": "1:43:51"}
|
| 961 |
+
{"current_steps": 961, "total_steps": 1235, "loss": 0.1767, "lr": 5.7483207170498625e-06, "epoch": 3.891139240506329, "percentage": 77.81, "elapsed_time": "6:02:55", "remaining_time": "1:43:28"}
|
| 962 |
+
{"current_steps": 962, "total_steps": 1235, "loss": 0.1695, "lr": 5.708699979051613e-06, "epoch": 3.8951898734177215, "percentage": 77.89, "elapsed_time": "6:03:18", "remaining_time": "1:43:05"}
|
| 963 |
+
{"current_steps": 963, "total_steps": 1235, "loss": 0.1708, "lr": 5.66919351390751e-06, "epoch": 3.899240506329114, "percentage": 77.98, "elapsed_time": "6:03:42", "remaining_time": "1:42:43"}
|
| 964 |
+
{"current_steps": 964, "total_steps": 1235, "loss": 0.1666, "lr": 5.629801637510188e-06, "epoch": 3.9032911392405065, "percentage": 78.06, "elapsed_time": "6:04:05", "remaining_time": "1:42:21"}
|
| 965 |
+
{"current_steps": 965, "total_steps": 1235, "loss": 0.1739, "lr": 5.590524664836043e-06, "epoch": 3.9073417721518986, "percentage": 78.14, "elapsed_time": "6:04:26", "remaining_time": "1:41:58"}
|
| 966 |
+
{"current_steps": 966, "total_steps": 1235, "loss": 0.1662, "lr": 5.551362909942708e-06, "epoch": 3.911392405063291, "percentage": 78.22, "elapsed_time": "6:04:47", "remaining_time": "1:41:35"}
|
| 967 |
+
{"current_steps": 967, "total_steps": 1235, "loss": 0.1817, "lr": 5.51231668596653e-06, "epoch": 3.9154430379746836, "percentage": 78.3, "elapsed_time": "6:05:11", "remaining_time": "1:41:12"}
|
| 968 |
+
{"current_steps": 968, "total_steps": 1235, "loss": 0.1712, "lr": 5.47338630512007e-06, "epoch": 3.9194936708860757, "percentage": 78.38, "elapsed_time": "6:05:33", "remaining_time": "1:40:49"}
|
| 969 |
+
{"current_steps": 969, "total_steps": 1235, "loss": 0.1656, "lr": 5.434572078689617e-06, "epoch": 3.923544303797468, "percentage": 78.46, "elapsed_time": "6:05:55", "remaining_time": "1:40:26"}
|
| 970 |
+
{"current_steps": 970, "total_steps": 1235, "loss": 0.1664, "lr": 5.395874317032694e-06, "epoch": 3.9275949367088607, "percentage": 78.54, "elapsed_time": "6:06:20", "remaining_time": "1:40:04"}
|
| 971 |
+
{"current_steps": 971, "total_steps": 1235, "loss": 0.1534, "lr": 5.357293329575573e-06, "epoch": 3.9316455696202532, "percentage": 78.62, "elapsed_time": "6:06:42", "remaining_time": "1:39:42"}
|
| 972 |
+
{"current_steps": 972, "total_steps": 1235, "loss": 0.1716, "lr": 5.318829424810797e-06, "epoch": 3.9356962025316458, "percentage": 78.7, "elapsed_time": "6:07:04", "remaining_time": "1:39:19"}
|
| 973 |
+
{"current_steps": 973, "total_steps": 1235, "loss": 0.1731, "lr": 5.280482910294728e-06, "epoch": 3.939746835443038, "percentage": 78.79, "elapsed_time": "6:07:26", "remaining_time": "1:38:56"}
|
| 974 |
+
{"current_steps": 974, "total_steps": 1235, "loss": 0.1657, "lr": 5.242254092645078e-06, "epoch": 3.9437974683544303, "percentage": 78.87, "elapsed_time": "6:07:48", "remaining_time": "1:38:33"}
|
| 975 |
+
{"current_steps": 975, "total_steps": 1235, "loss": 0.1728, "lr": 5.2041432775384445e-06, "epoch": 3.947848101265823, "percentage": 78.95, "elapsed_time": "6:08:09", "remaining_time": "1:38:10"}
|
| 976 |
+
{"current_steps": 976, "total_steps": 1235, "loss": 0.1618, "lr": 5.166150769707892e-06, "epoch": 3.951898734177215, "percentage": 79.03, "elapsed_time": "6:08:30", "remaining_time": "1:37:47"}
|
| 977 |
+
{"current_steps": 977, "total_steps": 1235, "loss": 0.1585, "lr": 5.128276872940503e-06, "epoch": 3.9559493670886074, "percentage": 79.11, "elapsed_time": "6:08:50", "remaining_time": "1:37:24"}
|
| 978 |
+
{"current_steps": 978, "total_steps": 1235, "loss": 0.1715, "lr": 5.090521890074953e-06, "epoch": 3.96, "percentage": 79.19, "elapsed_time": "6:09:14", "remaining_time": "1:37:01"}
|
| 979 |
+
{"current_steps": 979, "total_steps": 1235, "loss": 0.1695, "lr": 5.0528861229990675e-06, "epoch": 3.9640506329113925, "percentage": 79.27, "elapsed_time": "6:09:37", "remaining_time": "1:36:39"}
|
| 980 |
+
{"current_steps": 980, "total_steps": 1235, "loss": 0.1697, "lr": 5.015369872647442e-06, "epoch": 3.968101265822785, "percentage": 79.35, "elapsed_time": "6:10:00", "remaining_time": "1:36:16"}
|
| 981 |
+
{"current_steps": 981, "total_steps": 1235, "loss": 0.1572, "lr": 4.9779734389990195e-06, "epoch": 3.972151898734177, "percentage": 79.43, "elapsed_time": "6:10:22", "remaining_time": "1:35:53"}
|
| 982 |
+
{"current_steps": 982, "total_steps": 1235, "loss": 0.1655, "lr": 4.940697121074675e-06, "epoch": 3.9762025316455696, "percentage": 79.51, "elapsed_time": "6:10:44", "remaining_time": "1:35:30"}
|
| 983 |
+
{"current_steps": 983, "total_steps": 1235, "loss": 0.1658, "lr": 4.903541216934864e-06, "epoch": 3.980253164556962, "percentage": 79.6, "elapsed_time": "6:11:06", "remaining_time": "1:35:08"}
|
| 984 |
+
{"current_steps": 984, "total_steps": 1235, "loss": 0.162, "lr": 4.8665060236772e-06, "epoch": 3.984303797468354, "percentage": 79.68, "elapsed_time": "6:11:29", "remaining_time": "1:34:45"}
|
| 985 |
+
{"current_steps": 985, "total_steps": 1235, "loss": 0.1723, "lr": 4.829591837434102e-06, "epoch": 3.9883544303797467, "percentage": 79.76, "elapsed_time": "6:11:51", "remaining_time": "1:34:22"}
|
| 986 |
+
{"current_steps": 986, "total_steps": 1235, "loss": 0.1796, "lr": 4.792798953370424e-06, "epoch": 3.992405063291139, "percentage": 79.84, "elapsed_time": "6:12:14", "remaining_time": "1:34:00"}
|
| 987 |
+
{"current_steps": 987, "total_steps": 1235, "loss": 0.1673, "lr": 4.756127665681083e-06, "epoch": 3.9964556962025317, "percentage": 79.92, "elapsed_time": "6:12:36", "remaining_time": "1:33:37"}
|
| 988 |
+
{"current_steps": 988, "total_steps": 1235, "loss": 0.165, "lr": 4.719578267588725e-06, "epoch": 4.0, "percentage": 80.0, "elapsed_time": "6:12:56", "remaining_time": "1:33:14"}
|
| 989 |
+
{"current_steps": 989, "total_steps": 1235, "loss": 0.1201, "lr": 4.6831510513413525e-06, "epoch": 4.004050632911392, "percentage": 80.08, "elapsed_time": "6:14:10", "remaining_time": "1:33:04"}
|
| 990 |
+
{"current_steps": 990, "total_steps": 1235, "loss": 0.1199, "lr": 4.6468463082100176e-06, "epoch": 4.008101265822785, "percentage": 80.16, "elapsed_time": "6:14:33", "remaining_time": "1:32:41"}
|
| 991 |
+
{"current_steps": 991, "total_steps": 1235, "loss": 0.1104, "lr": 4.610664328486485e-06, "epoch": 4.012151898734177, "percentage": 80.24, "elapsed_time": "6:14:56", "remaining_time": "1:32:19"}
|
| 992 |
+
{"current_steps": 992, "total_steps": 1235, "loss": 0.1135, "lr": 4.5746054014809e-06, "epoch": 4.01620253164557, "percentage": 80.32, "elapsed_time": "6:15:19", "remaining_time": "1:31:56"}
|
| 993 |
+
{"current_steps": 993, "total_steps": 1235, "loss": 0.1146, "lr": 4.5386698155194766e-06, "epoch": 4.020253164556962, "percentage": 80.4, "elapsed_time": "6:15:40", "remaining_time": "1:31:33"}
|