Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bef6c55424d99e122ac60cbbf5004d56126bc38562e33818e16b290f40dcad05
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:93d86a74509aaee2f5f49f34e1e59cfaad2e86a75a92317d14a41517da40a323
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0e90fc3538ddd849cf7b5cfbbc98867bea09d97a0ebcbd14ece1d3464158e5f3
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c38ee9ab9dfb7f673b7ea2fce244f466723d08159d577684bf4cecf7d53eebac
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -785,3 +785,246 @@
|
|
| 785 |
{"current_steps": 542, "total_steps": 1215, "loss": 0.3277, "lr": 2.7112766498590944e-05, "epoch": 2.2281603288797536, "percentage": 44.61, "elapsed_time": "3:30:58", "remaining_time": "4:21:58"}
|
| 786 |
{"current_steps": 543, "total_steps": 1215, "loss": 0.3352, "lr": 2.705900971084635e-05, "epoch": 2.2322713257965057, "percentage": 44.69, "elapsed_time": "3:31:21", "remaining_time": "4:21:34"}
|
| 787 |
{"current_steps": 544, "total_steps": 1215, "loss": 0.3334, "lr": 2.7005194605064122e-05, "epoch": 2.2363823227132578, "percentage": 44.77, "elapsed_time": "3:31:44", "remaining_time": "4:21:11"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 785 |
{"current_steps": 542, "total_steps": 1215, "loss": 0.3277, "lr": 2.7112766498590944e-05, "epoch": 2.2281603288797536, "percentage": 44.61, "elapsed_time": "3:30:58", "remaining_time": "4:21:58"}
|
| 786 |
{"current_steps": 543, "total_steps": 1215, "loss": 0.3352, "lr": 2.705900971084635e-05, "epoch": 2.2322713257965057, "percentage": 44.69, "elapsed_time": "3:31:21", "remaining_time": "4:21:34"}
|
| 787 |
{"current_steps": 544, "total_steps": 1215, "loss": 0.3334, "lr": 2.7005194605064122e-05, "epoch": 2.2363823227132578, "percentage": 44.77, "elapsed_time": "3:31:44", "remaining_time": "4:21:11"}
|
| 788 |
+
{"current_steps": 545, "total_steps": 1215, "loss": 0.3299, "lr": 2.6951321625837975e-05, "epoch": 2.2404933196300103, "percentage": 44.86, "elapsed_time": "3:32:08", "remaining_time": "4:20:47"}
|
| 789 |
+
{"current_steps": 546, "total_steps": 1215, "loss": 0.3338, "lr": 2.6897391218239746e-05, "epoch": 2.2446043165467624, "percentage": 44.94, "elapsed_time": "3:32:30", "remaining_time": "4:20:23"}
|
| 790 |
+
{"current_steps": 547, "total_steps": 1215, "loss": 0.3353, "lr": 2.6843403827815714e-05, "epoch": 2.248715313463515, "percentage": 45.02, "elapsed_time": "3:32:53", "remaining_time": "4:19:58"}
|
| 791 |
+
{"current_steps": 548, "total_steps": 1215, "loss": 0.3274, "lr": 2.6789359900582935e-05, "epoch": 2.252826310380267, "percentage": 45.1, "elapsed_time": "3:33:16", "remaining_time": "4:19:35"}
|
| 792 |
+
{"current_steps": 549, "total_steps": 1215, "loss": 0.344, "lr": 2.673525988302553e-05, "epoch": 2.2569373072970196, "percentage": 45.19, "elapsed_time": "3:33:39", "remaining_time": "4:19:11"}
|
| 793 |
+
{"current_steps": 550, "total_steps": 1215, "loss": 0.3387, "lr": 2.6681104222091018e-05, "epoch": 2.2610483042137717, "percentage": 45.27, "elapsed_time": "3:34:03", "remaining_time": "4:18:48"}
|
| 794 |
+
{"current_steps": 551, "total_steps": 1215, "loss": 0.3306, "lr": 2.662689336518661e-05, "epoch": 2.265159301130524, "percentage": 45.35, "elapsed_time": "3:34:25", "remaining_time": "4:18:24"}
|
| 795 |
+
{"current_steps": 552, "total_steps": 1215, "loss": 0.334, "lr": 2.6572627760175523e-05, "epoch": 2.2692702980472763, "percentage": 45.43, "elapsed_time": "3:34:49", "remaining_time": "4:18:01"}
|
| 796 |
+
{"current_steps": 553, "total_steps": 1215, "loss": 0.3245, "lr": 2.6518307855373276e-05, "epoch": 2.273381294964029, "percentage": 45.51, "elapsed_time": "3:35:12", "remaining_time": "4:17:37"}
|
| 797 |
+
{"current_steps": 554, "total_steps": 1215, "loss": 0.3337, "lr": 2.6463934099543992e-05, "epoch": 2.277492291880781, "percentage": 45.6, "elapsed_time": "3:35:34", "remaining_time": "4:17:12"}
|
| 798 |
+
{"current_steps": 555, "total_steps": 1215, "loss": 0.336, "lr": 2.6409506941896665e-05, "epoch": 2.2816032887975335, "percentage": 45.68, "elapsed_time": "3:35:58", "remaining_time": "4:16:49"}
|
| 799 |
+
{"current_steps": 556, "total_steps": 1215, "loss": 0.331, "lr": 2.6355026832081493e-05, "epoch": 2.2857142857142856, "percentage": 45.76, "elapsed_time": "3:36:20", "remaining_time": "4:16:25"}
|
| 800 |
+
{"current_steps": 557, "total_steps": 1215, "loss": 0.3318, "lr": 2.6300494220186113e-05, "epoch": 2.289825282631038, "percentage": 45.84, "elapsed_time": "3:36:43", "remaining_time": "4:16:00"}
|
| 801 |
+
{"current_steps": 558, "total_steps": 1215, "loss": 0.3244, "lr": 2.6245909556731937e-05, "epoch": 2.2939362795477902, "percentage": 45.93, "elapsed_time": "3:37:06", "remaining_time": "4:15:37"}
|
| 802 |
+
{"current_steps": 559, "total_steps": 1215, "loss": 0.3342, "lr": 2.6191273292670372e-05, "epoch": 2.2980472764645428, "percentage": 46.01, "elapsed_time": "3:37:28", "remaining_time": "4:15:13"}
|
| 803 |
+
{"current_steps": 560, "total_steps": 1215, "loss": 0.3394, "lr": 2.6136585879379145e-05, "epoch": 2.302158273381295, "percentage": 46.09, "elapsed_time": "3:37:53", "remaining_time": "4:14:50"}
|
| 804 |
+
{"current_steps": 561, "total_steps": 1215, "loss": 0.3289, "lr": 2.608184776865854e-05, "epoch": 2.3062692702980474, "percentage": 46.17, "elapsed_time": "3:38:16", "remaining_time": "4:14:27"}
|
| 805 |
+
{"current_steps": 562, "total_steps": 1215, "loss": 0.322, "lr": 2.602705941272769e-05, "epoch": 2.3103802672147995, "percentage": 46.26, "elapsed_time": "3:38:39", "remaining_time": "4:14:04"}
|
| 806 |
+
{"current_steps": 563, "total_steps": 1215, "loss": 0.3332, "lr": 2.597222126422081e-05, "epoch": 2.314491264131552, "percentage": 46.34, "elapsed_time": "3:39:02", "remaining_time": "4:13:40"}
|
| 807 |
+
{"current_steps": 564, "total_steps": 1215, "loss": 0.3228, "lr": 2.5917333776183503e-05, "epoch": 2.318602261048304, "percentage": 46.42, "elapsed_time": "3:39:24", "remaining_time": "4:13:15"}
|
| 808 |
+
{"current_steps": 565, "total_steps": 1215, "loss": 0.3197, "lr": 2.586239740206897e-05, "epoch": 2.3227132579650567, "percentage": 46.5, "elapsed_time": "3:39:48", "remaining_time": "4:12:52"}
|
| 809 |
+
{"current_steps": 566, "total_steps": 1215, "loss": 0.3279, "lr": 2.5807412595734283e-05, "epoch": 2.3268242548818088, "percentage": 46.58, "elapsed_time": "3:40:10", "remaining_time": "4:12:28"}
|
| 810 |
+
{"current_steps": 567, "total_steps": 1215, "loss": 0.324, "lr": 2.5752379811436655e-05, "epoch": 2.3309352517985613, "percentage": 46.67, "elapsed_time": "3:40:33", "remaining_time": "4:12:03"}
|
| 811 |
+
{"current_steps": 568, "total_steps": 1215, "loss": 0.3347, "lr": 2.5697299503829657e-05, "epoch": 2.3350462487153134, "percentage": 46.75, "elapsed_time": "3:40:55", "remaining_time": "4:11:39"}
|
| 812 |
+
{"current_steps": 569, "total_steps": 1215, "loss": 0.3292, "lr": 2.5642172127959475e-05, "epoch": 2.339157245632066, "percentage": 46.83, "elapsed_time": "3:41:17", "remaining_time": "4:11:13"}
|
| 813 |
+
{"current_steps": 570, "total_steps": 1215, "loss": 0.3323, "lr": 2.558699813926115e-05, "epoch": 2.343268242548818, "percentage": 46.91, "elapsed_time": "3:41:40", "remaining_time": "4:10:50"}
|
| 814 |
+
{"current_steps": 571, "total_steps": 1215, "loss": 0.3317, "lr": 2.5531777993554813e-05, "epoch": 2.3473792394655706, "percentage": 47.0, "elapsed_time": "3:42:02", "remaining_time": "4:10:26"}
|
| 815 |
+
{"current_steps": 572, "total_steps": 1215, "loss": 0.3428, "lr": 2.5476512147041926e-05, "epoch": 2.3514902363823227, "percentage": 47.08, "elapsed_time": "3:42:25", "remaining_time": "4:10:01"}
|
| 816 |
+
{"current_steps": 573, "total_steps": 1215, "loss": 0.3284, "lr": 2.5421201056301507e-05, "epoch": 2.3556012332990752, "percentage": 47.16, "elapsed_time": "3:42:48", "remaining_time": "4:09:37"}
|
| 817 |
+
{"current_steps": 574, "total_steps": 1215, "loss": 0.3275, "lr": 2.5365845178286358e-05, "epoch": 2.3597122302158273, "percentage": 47.24, "elapsed_time": "3:43:10", "remaining_time": "4:09:13"}
|
| 818 |
+
{"current_steps": 575, "total_steps": 1215, "loss": 0.3301, "lr": 2.5310444970319292e-05, "epoch": 2.3638232271325794, "percentage": 47.33, "elapsed_time": "3:43:34", "remaining_time": "4:08:50"}
|
| 819 |
+
{"current_steps": 576, "total_steps": 1215, "loss": 0.3375, "lr": 2.525500089008936e-05, "epoch": 2.367934224049332, "percentage": 47.41, "elapsed_time": "3:43:56", "remaining_time": "4:08:26"}
|
| 820 |
+
{"current_steps": 577, "total_steps": 1215, "loss": 0.3207, "lr": 2.5199513395648047e-05, "epoch": 2.3720452209660845, "percentage": 47.49, "elapsed_time": "3:44:18", "remaining_time": "4:08:01"}
|
| 821 |
+
{"current_steps": 578, "total_steps": 1215, "loss": 0.3335, "lr": 2.5143982945405527e-05, "epoch": 2.3761562178828366, "percentage": 47.57, "elapsed_time": "3:44:39", "remaining_time": "4:07:35"}
|
| 822 |
+
{"current_steps": 579, "total_steps": 1215, "loss": 0.3364, "lr": 2.5088409998126827e-05, "epoch": 2.3802672147995887, "percentage": 47.65, "elapsed_time": "3:45:03", "remaining_time": "4:07:13"}
|
| 823 |
+
{"current_steps": 580, "total_steps": 1215, "loss": 0.3296, "lr": 2.5032795012928093e-05, "epoch": 2.3843782117163412, "percentage": 47.74, "elapsed_time": "3:45:25", "remaining_time": "4:06:48"}
|
| 824 |
+
{"current_steps": 581, "total_steps": 1215, "loss": 0.3252, "lr": 2.4977138449272746e-05, "epoch": 2.3884892086330938, "percentage": 47.82, "elapsed_time": "3:45:48", "remaining_time": "4:06:24"}
|
| 825 |
+
{"current_steps": 582, "total_steps": 1215, "loss": 0.3292, "lr": 2.4921440766967718e-05, "epoch": 2.392600205549846, "percentage": 47.9, "elapsed_time": "3:46:12", "remaining_time": "4:06:01"}
|
| 826 |
+
{"current_steps": 583, "total_steps": 1215, "loss": 0.3345, "lr": 2.4865702426159633e-05, "epoch": 2.396711202466598, "percentage": 47.98, "elapsed_time": "3:46:34", "remaining_time": "4:05:37"}
|
| 827 |
+
{"current_steps": 584, "total_steps": 1215, "loss": 0.3272, "lr": 2.4809923887331028e-05, "epoch": 2.4008221993833505, "percentage": 48.07, "elapsed_time": "3:46:56", "remaining_time": "4:05:12"}
|
| 828 |
+
{"current_steps": 585, "total_steps": 1215, "loss": 0.3244, "lr": 2.4754105611296534e-05, "epoch": 2.4049331963001026, "percentage": 48.15, "elapsed_time": "3:47:19", "remaining_time": "4:04:48"}
|
| 829 |
+
{"current_steps": 586, "total_steps": 1215, "loss": 0.3211, "lr": 2.4698248059199056e-05, "epoch": 2.409044193216855, "percentage": 48.23, "elapsed_time": "3:47:41", "remaining_time": "4:04:24"}
|
| 830 |
+
{"current_steps": 587, "total_steps": 1215, "loss": 0.3227, "lr": 2.4642351692505998e-05, "epoch": 2.4131551901336072, "percentage": 48.31, "elapsed_time": "3:48:04", "remaining_time": "4:04:00"}
|
| 831 |
+
{"current_steps": 588, "total_steps": 1215, "loss": 0.3255, "lr": 2.4586416973005414e-05, "epoch": 2.41726618705036, "percentage": 48.4, "elapsed_time": "3:48:27", "remaining_time": "4:03:36"}
|
| 832 |
+
{"current_steps": 589, "total_steps": 1215, "loss": 0.3297, "lr": 2.453044436280223e-05, "epoch": 2.421377183967112, "percentage": 48.48, "elapsed_time": "3:48:50", "remaining_time": "4:03:13"}
|
| 833 |
+
{"current_steps": 590, "total_steps": 1215, "loss": 0.3351, "lr": 2.4474434324314388e-05, "epoch": 2.4254881808838644, "percentage": 48.56, "elapsed_time": "3:49:12", "remaining_time": "4:02:48"}
|
| 834 |
+
{"current_steps": 591, "total_steps": 1215, "loss": 0.3185, "lr": 2.4418387320269047e-05, "epoch": 2.4295991778006165, "percentage": 48.64, "elapsed_time": "3:49:36", "remaining_time": "4:02:25"}
|
| 835 |
+
{"current_steps": 592, "total_steps": 1215, "loss": 0.3262, "lr": 2.4362303813698766e-05, "epoch": 2.433710174717369, "percentage": 48.72, "elapsed_time": "3:50:00", "remaining_time": "4:02:02"}
|
| 836 |
+
{"current_steps": 593, "total_steps": 1215, "loss": 0.3317, "lr": 2.4306184267937654e-05, "epoch": 2.437821171634121, "percentage": 48.81, "elapsed_time": "3:50:22", "remaining_time": "4:01:38"}
|
| 837 |
+
{"current_steps": 594, "total_steps": 1215, "loss": 0.3325, "lr": 2.425002914661758e-05, "epoch": 2.4419321685508737, "percentage": 48.89, "elapsed_time": "3:50:44", "remaining_time": "4:01:13"}
|
| 838 |
+
{"current_steps": 595, "total_steps": 1215, "loss": 0.3186, "lr": 2.419383891366431e-05, "epoch": 2.446043165467626, "percentage": 48.97, "elapsed_time": "3:51:07", "remaining_time": "4:00:50"}
|
| 839 |
+
{"current_steps": 596, "total_steps": 1215, "loss": 0.3325, "lr": 2.4137614033293676e-05, "epoch": 2.4501541623843783, "percentage": 49.05, "elapsed_time": "3:51:29", "remaining_time": "4:00:25"}
|
| 840 |
+
{"current_steps": 597, "total_steps": 1215, "loss": 0.3258, "lr": 2.408135497000776e-05, "epoch": 2.4542651593011304, "percentage": 49.14, "elapsed_time": "3:51:53", "remaining_time": "4:00:03"}
|
| 841 |
+
{"current_steps": 598, "total_steps": 1215, "loss": 0.3286, "lr": 2.4025062188591046e-05, "epoch": 2.458376156217883, "percentage": 49.22, "elapsed_time": "3:52:15", "remaining_time": "3:59:38"}
|
| 842 |
+
{"current_steps": 599, "total_steps": 1215, "loss": 0.3257, "lr": 2.3968736154106574e-05, "epoch": 2.462487153134635, "percentage": 49.3, "elapsed_time": "3:52:38", "remaining_time": "3:59:14"}
|
| 843 |
+
{"current_steps": 600, "total_steps": 1215, "loss": 0.3348, "lr": 2.3912377331892112e-05, "epoch": 2.4665981500513876, "percentage": 49.38, "elapsed_time": "3:53:01", "remaining_time": "3:58:50"}
|
| 844 |
+
{"current_steps": 601, "total_steps": 1215, "loss": 0.3247, "lr": 2.3855986187556295e-05, "epoch": 2.4707091469681397, "percentage": 49.47, "elapsed_time": "3:53:23", "remaining_time": "3:58:26"}
|
| 845 |
+
{"current_steps": 602, "total_steps": 1215, "loss": 0.3288, "lr": 2.3799563186974802e-05, "epoch": 2.4748201438848922, "percentage": 49.55, "elapsed_time": "3:53:45", "remaining_time": "3:58:01"}
|
| 846 |
+
{"current_steps": 603, "total_steps": 1215, "loss": 0.3343, "lr": 2.374310879628647e-05, "epoch": 2.4789311408016443, "percentage": 49.63, "elapsed_time": "3:54:09", "remaining_time": "3:57:38"}
|
| 847 |
+
{"current_steps": 604, "total_steps": 1215, "loss": 0.3355, "lr": 2.3686623481889496e-05, "epoch": 2.483042137718397, "percentage": 49.71, "elapsed_time": "3:54:31", "remaining_time": "3:57:14"}
|
| 848 |
+
{"current_steps": 605, "total_steps": 1215, "loss": 0.3296, "lr": 2.3630107710437526e-05, "epoch": 2.487153134635149, "percentage": 49.79, "elapsed_time": "3:54:54", "remaining_time": "3:56:51"}
|
| 849 |
+
{"current_steps": 606, "total_steps": 1215, "loss": 0.3421, "lr": 2.3573561948835836e-05, "epoch": 2.4912641315519015, "percentage": 49.88, "elapsed_time": "3:55:17", "remaining_time": "3:56:27"}
|
| 850 |
+
{"current_steps": 607, "total_steps": 1215, "loss": 0.3254, "lr": 2.3516986664237474e-05, "epoch": 2.4953751284686536, "percentage": 49.96, "elapsed_time": "3:55:41", "remaining_time": "3:56:04"}
|
| 851 |
+
{"current_steps": 608, "total_steps": 1215, "loss": 0.3272, "lr": 2.3460382324039377e-05, "epoch": 2.499486125385406, "percentage": 50.04, "elapsed_time": "3:56:03", "remaining_time": "3:55:40"}
|
| 852 |
+
{"current_steps": 609, "total_steps": 1215, "loss": 0.3292, "lr": 2.3403749395878542e-05, "epoch": 2.5035971223021583, "percentage": 50.12, "elapsed_time": "3:56:27", "remaining_time": "3:55:17"}
|
| 853 |
+
{"current_steps": 610, "total_steps": 1215, "loss": 0.3307, "lr": 2.3347088347628128e-05, "epoch": 2.5077081192189103, "percentage": 50.21, "elapsed_time": "3:56:50", "remaining_time": "3:54:53"}
|
| 854 |
+
{"current_steps": 611, "total_steps": 1215, "loss": 0.324, "lr": 2.3290399647393628e-05, "epoch": 2.511819116135663, "percentage": 50.29, "elapsed_time": "3:57:12", "remaining_time": "3:54:29"}
|
| 855 |
+
{"current_steps": 612, "total_steps": 1215, "loss": 0.3343, "lr": 2.3233683763508957e-05, "epoch": 2.5159301130524154, "percentage": 50.37, "elapsed_time": "3:57:36", "remaining_time": "3:54:06"}
|
| 856 |
+
{"current_steps": 613, "total_steps": 1215, "loss": 0.34, "lr": 2.317694116453263e-05, "epoch": 2.5200411099691675, "percentage": 50.45, "elapsed_time": "3:57:59", "remaining_time": "3:53:43"}
|
| 857 |
+
{"current_steps": 614, "total_steps": 1215, "loss": 0.3338, "lr": 2.3120172319243864e-05, "epoch": 2.5241521068859196, "percentage": 50.53, "elapsed_time": "3:58:23", "remaining_time": "3:53:20"}
|
| 858 |
+
{"current_steps": 615, "total_steps": 1215, "loss": 0.3311, "lr": 2.3063377696638707e-05, "epoch": 2.528263103802672, "percentage": 50.62, "elapsed_time": "3:58:46", "remaining_time": "3:52:57"}
|
| 859 |
+
{"current_steps": 616, "total_steps": 1215, "loss": 0.3335, "lr": 2.300655776592616e-05, "epoch": 2.5323741007194247, "percentage": 50.7, "elapsed_time": "3:59:08", "remaining_time": "3:52:32"}
|
| 860 |
+
{"current_steps": 617, "total_steps": 1215, "loss": 0.3235, "lr": 2.294971299652432e-05, "epoch": 2.536485097636177, "percentage": 50.78, "elapsed_time": "3:59:32", "remaining_time": "3:52:09"}
|
| 861 |
+
{"current_steps": 618, "total_steps": 1215, "loss": 0.3321, "lr": 2.2892843858056474e-05, "epoch": 2.540596094552929, "percentage": 50.86, "elapsed_time": "3:59:54", "remaining_time": "3:51:45"}
|
| 862 |
+
{"current_steps": 619, "total_steps": 1215, "loss": 0.3167, "lr": 2.283595082034725e-05, "epoch": 2.5447070914696814, "percentage": 50.95, "elapsed_time": "4:00:18", "remaining_time": "3:51:22"}
|
| 863 |
+
{"current_steps": 620, "total_steps": 1215, "loss": 0.3324, "lr": 2.2779034353418707e-05, "epoch": 2.548818088386434, "percentage": 51.03, "elapsed_time": "4:00:40", "remaining_time": "3:50:58"}
|
| 864 |
+
{"current_steps": 621, "total_steps": 1215, "loss": 0.3286, "lr": 2.2722094927486472e-05, "epoch": 2.552929085303186, "percentage": 51.11, "elapsed_time": "4:01:02", "remaining_time": "3:50:33"}
|
| 865 |
+
{"current_steps": 622, "total_steps": 1215, "loss": 0.3383, "lr": 2.2665133012955844e-05, "epoch": 2.557040082219938, "percentage": 51.19, "elapsed_time": "4:01:25", "remaining_time": "3:50:10"}
|
| 866 |
+
{"current_steps": 623, "total_steps": 1215, "loss": 0.3289, "lr": 2.2608149080417913e-05, "epoch": 2.5611510791366907, "percentage": 51.28, "elapsed_time": "4:01:47", "remaining_time": "3:49:46"}
|
| 867 |
+
{"current_steps": 624, "total_steps": 1215, "loss": 0.3244, "lr": 2.2551143600645672e-05, "epoch": 2.565262076053443, "percentage": 51.36, "elapsed_time": "4:02:11", "remaining_time": "3:49:22"}
|
| 868 |
+
{"current_steps": 625, "total_steps": 1215, "loss": 0.3361, "lr": 2.249411704459013e-05, "epoch": 2.5693730729701953, "percentage": 51.44, "elapsed_time": "4:02:34", "remaining_time": "3:48:58"}
|
| 869 |
+
{"current_steps": 626, "total_steps": 1215, "loss": 0.3142, "lr": 2.2437069883376404e-05, "epoch": 2.5734840698869474, "percentage": 51.52, "elapsed_time": "4:02:57", "remaining_time": "3:48:35"}
|
| 870 |
+
{"current_steps": 627, "total_steps": 1215, "loss": 0.324, "lr": 2.238000258829986e-05, "epoch": 2.5775950668037, "percentage": 51.6, "elapsed_time": "4:03:21", "remaining_time": "3:48:13"}
|
| 871 |
+
{"current_steps": 628, "total_steps": 1215, "loss": 0.3226, "lr": 2.2322915630822184e-05, "epoch": 2.581706063720452, "percentage": 51.69, "elapsed_time": "4:03:44", "remaining_time": "3:47:49"}
|
| 872 |
+
{"current_steps": 629, "total_steps": 1215, "loss": 0.3315, "lr": 2.226580948256751e-05, "epoch": 2.5858170606372046, "percentage": 51.77, "elapsed_time": "4:04:07", "remaining_time": "3:47:26"}
|
| 873 |
+
{"current_steps": 630, "total_steps": 1215, "loss": 0.3291, "lr": 2.2208684615318515e-05, "epoch": 2.5899280575539567, "percentage": 51.85, "elapsed_time": "4:04:30", "remaining_time": "3:47:02"}
|
| 874 |
+
{"current_steps": 631, "total_steps": 1215, "loss": 0.3348, "lr": 2.2151541501012526e-05, "epoch": 2.5940390544707093, "percentage": 51.93, "elapsed_time": "4:04:53", "remaining_time": "3:46:38"}
|
| 875 |
+
{"current_steps": 632, "total_steps": 1215, "loss": 0.336, "lr": 2.2094380611737615e-05, "epoch": 2.5981500513874614, "percentage": 52.02, "elapsed_time": "4:05:15", "remaining_time": "3:46:14"}
|
| 876 |
+
{"current_steps": 633, "total_steps": 1215, "loss": 0.3221, "lr": 2.20372024197287e-05, "epoch": 2.602261048304214, "percentage": 52.1, "elapsed_time": "4:05:38", "remaining_time": "3:45:51"}
|
| 877 |
+
{"current_steps": 634, "total_steps": 1215, "loss": 0.3283, "lr": 2.1980007397363653e-05, "epoch": 2.606372045220966, "percentage": 52.18, "elapsed_time": "4:06:01", "remaining_time": "3:45:27"}
|
| 878 |
+
{"current_steps": 635, "total_steps": 1215, "loss": 0.3391, "lr": 2.1922796017159382e-05, "epoch": 2.6104830421377185, "percentage": 52.26, "elapsed_time": "4:06:25", "remaining_time": "3:45:04"}
|
| 879 |
+
{"current_steps": 636, "total_steps": 1215, "loss": 0.3181, "lr": 2.186556875176794e-05, "epoch": 2.6145940390544706, "percentage": 52.35, "elapsed_time": "4:06:48", "remaining_time": "3:44:41"}
|
| 880 |
+
{"current_steps": 637, "total_steps": 1215, "loss": 0.3334, "lr": 2.1808326073972618e-05, "epoch": 2.618705035971223, "percentage": 52.43, "elapsed_time": "4:07:12", "remaining_time": "3:44:18"}
|
| 881 |
+
{"current_steps": 638, "total_steps": 1215, "loss": 0.3328, "lr": 2.1751068456684026e-05, "epoch": 2.6228160328879753, "percentage": 52.51, "elapsed_time": "4:07:36", "remaining_time": "3:43:55"}
|
| 882 |
+
{"current_steps": 639, "total_steps": 1215, "loss": 0.3348, "lr": 2.1693796372936207e-05, "epoch": 2.626927029804728, "percentage": 52.59, "elapsed_time": "4:07:59", "remaining_time": "3:43:32"}
|
| 883 |
+
{"current_steps": 640, "total_steps": 1215, "loss": 0.3287, "lr": 2.1636510295882723e-05, "epoch": 2.63103802672148, "percentage": 52.67, "elapsed_time": "4:08:23", "remaining_time": "3:43:09"}
|
| 884 |
+
{"current_steps": 641, "total_steps": 1215, "loss": 0.3357, "lr": 2.1579210698792724e-05, "epoch": 2.635149023638232, "percentage": 52.76, "elapsed_time": "4:08:46", "remaining_time": "3:42:46"}
|
| 885 |
+
{"current_steps": 642, "total_steps": 1215, "loss": 0.3254, "lr": 2.1521898055047065e-05, "epoch": 2.6392600205549845, "percentage": 52.84, "elapsed_time": "4:09:09", "remaining_time": "3:42:22"}
|
| 886 |
+
{"current_steps": 643, "total_steps": 1215, "loss": 0.3405, "lr": 2.1464572838134393e-05, "epoch": 2.643371017471737, "percentage": 52.92, "elapsed_time": "4:09:32", "remaining_time": "3:41:59"}
|
| 887 |
+
{"current_steps": 644, "total_steps": 1215, "loss": 0.3337, "lr": 2.1407235521647216e-05, "epoch": 2.647482014388489, "percentage": 53.0, "elapsed_time": "4:09:55", "remaining_time": "3:41:36"}
|
| 888 |
+
{"current_steps": 645, "total_steps": 1215, "loss": 0.3223, "lr": 2.134988657927802e-05, "epoch": 2.6515930113052413, "percentage": 53.09, "elapsed_time": "4:10:19", "remaining_time": "3:41:13"}
|
| 889 |
+
{"current_steps": 646, "total_steps": 1215, "loss": 0.3399, "lr": 2.129252648481532e-05, "epoch": 2.655704008221994, "percentage": 53.17, "elapsed_time": "4:10:43", "remaining_time": "3:40:50"}
|
| 890 |
+
{"current_steps": 647, "total_steps": 1215, "loss": 0.3199, "lr": 2.123515571213977e-05, "epoch": 2.6598150051387464, "percentage": 53.25, "elapsed_time": "4:11:05", "remaining_time": "3:40:26"}
|
| 891 |
+
{"current_steps": 648, "total_steps": 1215, "loss": 0.3211, "lr": 2.1177774735220246e-05, "epoch": 2.6639260020554985, "percentage": 53.33, "elapsed_time": "4:11:28", "remaining_time": "3:40:02"}
|
| 892 |
+
{"current_steps": 649, "total_steps": 1215, "loss": 0.3347, "lr": 2.1120384028109928e-05, "epoch": 2.6680369989722506, "percentage": 53.42, "elapsed_time": "4:11:51", "remaining_time": "3:39:39"}
|
| 893 |
+
{"current_steps": 650, "total_steps": 1215, "loss": 0.337, "lr": 2.106298406494237e-05, "epoch": 2.672147995889003, "percentage": 53.5, "elapsed_time": "4:12:14", "remaining_time": "3:39:15"}
|
| 894 |
+
{"current_steps": 651, "total_steps": 1215, "loss": 0.3286, "lr": 2.1005575319927606e-05, "epoch": 2.6762589928057556, "percentage": 53.58, "elapsed_time": "4:12:38", "remaining_time": "3:38:52"}
|
| 895 |
+
{"current_steps": 652, "total_steps": 1215, "loss": 0.3344, "lr": 2.094815826734822e-05, "epoch": 2.6803699897225077, "percentage": 53.66, "elapsed_time": "4:13:01", "remaining_time": "3:38:29"}
|
| 896 |
+
{"current_steps": 653, "total_steps": 1215, "loss": 0.3347, "lr": 2.089073338155542e-05, "epoch": 2.68448098663926, "percentage": 53.74, "elapsed_time": "4:13:24", "remaining_time": "3:38:05"}
|
| 897 |
+
{"current_steps": 654, "total_steps": 1215, "loss": 0.3368, "lr": 2.0833301136965138e-05, "epoch": 2.6885919835560124, "percentage": 53.83, "elapsed_time": "4:13:47", "remaining_time": "3:37:42"}
|
| 898 |
+
{"current_steps": 655, "total_steps": 1215, "loss": 0.3317, "lr": 2.0775862008054102e-05, "epoch": 2.692702980472765, "percentage": 53.91, "elapsed_time": "4:14:10", "remaining_time": "3:37:18"}
|
| 899 |
+
{"current_steps": 656, "total_steps": 1215, "loss": 0.3327, "lr": 2.0718416469355917e-05, "epoch": 2.696813977389517, "percentage": 53.99, "elapsed_time": "4:14:32", "remaining_time": "3:36:54"}
|
| 900 |
+
{"current_steps": 657, "total_steps": 1215, "loss": 0.3254, "lr": 2.066096499545712e-05, "epoch": 2.700924974306269, "percentage": 54.07, "elapsed_time": "4:14:55", "remaining_time": "3:36:31"}
|
| 901 |
+
{"current_steps": 658, "total_steps": 1215, "loss": 0.3324, "lr": 2.0603508060993306e-05, "epoch": 2.7050359712230216, "percentage": 54.16, "elapsed_time": "4:15:18", "remaining_time": "3:36:07"}
|
| 902 |
+
{"current_steps": 659, "total_steps": 1215, "loss": 0.33, "lr": 2.0546046140645178e-05, "epoch": 2.7091469681397737, "percentage": 54.24, "elapsed_time": "4:15:41", "remaining_time": "3:35:43"}
|
| 903 |
+
{"current_steps": 660, "total_steps": 1215, "loss": 0.3375, "lr": 2.0488579709134623e-05, "epoch": 2.7132579650565263, "percentage": 54.32, "elapsed_time": "4:16:03", "remaining_time": "3:35:19"}
|
| 904 |
+
{"current_steps": 661, "total_steps": 1215, "loss": 0.3324, "lr": 2.04311092412208e-05, "epoch": 2.7173689619732784, "percentage": 54.4, "elapsed_time": "4:16:26", "remaining_time": "3:34:56"}
|
| 905 |
+
{"current_steps": 662, "total_steps": 1215, "loss": 0.331, "lr": 2.0373635211696214e-05, "epoch": 2.721479958890031, "percentage": 54.49, "elapsed_time": "4:16:49", "remaining_time": "3:34:32"}
|
| 906 |
+
{"current_steps": 663, "total_steps": 1215, "loss": 0.3354, "lr": 2.0316158095382797e-05, "epoch": 2.725590955806783, "percentage": 54.57, "elapsed_time": "4:17:12", "remaining_time": "3:34:09"}
|
| 907 |
+
{"current_steps": 664, "total_steps": 1215, "loss": 0.3236, "lr": 2.0258678367127972e-05, "epoch": 2.7297019527235356, "percentage": 54.65, "elapsed_time": "4:17:35", "remaining_time": "3:33:45"}
|
| 908 |
+
{"current_steps": 665, "total_steps": 1215, "loss": 0.3232, "lr": 2.0201196501800768e-05, "epoch": 2.7338129496402876, "percentage": 54.73, "elapsed_time": "4:17:58", "remaining_time": "3:33:21"}
|
| 909 |
+
{"current_steps": 666, "total_steps": 1215, "loss": 0.3277, "lr": 2.0143712974287838e-05, "epoch": 2.73792394655704, "percentage": 54.81, "elapsed_time": "4:18:19", "remaining_time": "3:32:56"}
|
| 910 |
+
{"current_steps": 667, "total_steps": 1215, "loss": 0.3419, "lr": 2.0086228259489578e-05, "epoch": 2.7420349434737923, "percentage": 54.9, "elapsed_time": "4:18:43", "remaining_time": "3:32:33"}
|
| 911 |
+
{"current_steps": 668, "total_steps": 1215, "loss": 0.3241, "lr": 2.0028742832316202e-05, "epoch": 2.746145940390545, "percentage": 54.98, "elapsed_time": "4:19:06", "remaining_time": "3:32:10"}
|
| 912 |
+
{"current_steps": 669, "total_steps": 1215, "loss": 0.3206, "lr": 1.99712571676838e-05, "epoch": 2.750256937307297, "percentage": 55.06, "elapsed_time": "4:19:30", "remaining_time": "3:31:47"}
|
| 913 |
+
{"current_steps": 670, "total_steps": 1215, "loss": 0.3441, "lr": 1.9913771740510426e-05, "epoch": 2.7543679342240495, "percentage": 55.14, "elapsed_time": "4:19:53", "remaining_time": "3:31:24"}
|
| 914 |
+
{"current_steps": 671, "total_steps": 1215, "loss": 0.3327, "lr": 1.9856287025712172e-05, "epoch": 2.7584789311408016, "percentage": 55.23, "elapsed_time": "4:20:15", "remaining_time": "3:30:59"}
|
| 915 |
+
{"current_steps": 672, "total_steps": 1215, "loss": 0.3325, "lr": 1.979880349819924e-05, "epoch": 2.762589928057554, "percentage": 55.31, "elapsed_time": "4:20:37", "remaining_time": "3:30:36"}
|
| 916 |
+
{"current_steps": 673, "total_steps": 1215, "loss": 0.329, "lr": 1.974132163287203e-05, "epoch": 2.766700924974306, "percentage": 55.39, "elapsed_time": "4:21:01", "remaining_time": "3:30:12"}
|
| 917 |
+
{"current_steps": 674, "total_steps": 1215, "loss": 0.3319, "lr": 1.9683841904617217e-05, "epoch": 2.7708119218910587, "percentage": 55.47, "elapsed_time": "4:21:24", "remaining_time": "3:29:49"}
|
| 918 |
+
{"current_steps": 675, "total_steps": 1215, "loss": 0.3313, "lr": 1.9626364788303796e-05, "epoch": 2.774922918807811, "percentage": 55.56, "elapsed_time": "4:21:46", "remaining_time": "3:29:25"}
|
| 919 |
+
{"current_steps": 676, "total_steps": 1215, "loss": 0.3359, "lr": 1.956889075877921e-05, "epoch": 2.779033915724563, "percentage": 55.64, "elapsed_time": "4:22:09", "remaining_time": "3:29:01"}
|
| 920 |
+
{"current_steps": 677, "total_steps": 1215, "loss": 0.3269, "lr": 1.9511420290865387e-05, "epoch": 2.7831449126413155, "percentage": 55.72, "elapsed_time": "4:22:30", "remaining_time": "3:28:36"}
|
| 921 |
+
{"current_steps": 678, "total_steps": 1215, "loss": 0.3315, "lr": 1.945395385935483e-05, "epoch": 2.787255909558068, "percentage": 55.8, "elapsed_time": "4:22:52", "remaining_time": "3:28:12"}
|
| 922 |
+
{"current_steps": 679, "total_steps": 1215, "loss": 0.317, "lr": 1.9396491939006693e-05, "epoch": 2.79136690647482, "percentage": 55.88, "elapsed_time": "4:23:15", "remaining_time": "3:27:49"}
|
| 923 |
+
{"current_steps": 680, "total_steps": 1215, "loss": 0.3355, "lr": 1.9339035004542883e-05, "epoch": 2.795477903391572, "percentage": 55.97, "elapsed_time": "4:23:38", "remaining_time": "3:27:25"}
|
| 924 |
+
{"current_steps": 681, "total_steps": 1215, "loss": 0.3274, "lr": 1.9281583530644087e-05, "epoch": 2.7995889003083247, "percentage": 56.05, "elapsed_time": "4:23:59", "remaining_time": "3:27:00"}
|
| 925 |
+
{"current_steps": 682, "total_steps": 1215, "loss": 0.3161, "lr": 1.9224137991945898e-05, "epoch": 2.8036998972250773, "percentage": 56.13, "elapsed_time": "4:24:22", "remaining_time": "3:26:37"}
|
| 926 |
+
{"current_steps": 683, "total_steps": 1215, "loss": 0.3326, "lr": 1.9166698863034865e-05, "epoch": 2.8078108941418294, "percentage": 56.21, "elapsed_time": "4:24:45", "remaining_time": "3:26:13"}
|
| 927 |
+
{"current_steps": 684, "total_steps": 1215, "loss": 0.3306, "lr": 1.910926661844459e-05, "epoch": 2.8119218910585815, "percentage": 56.3, "elapsed_time": "4:25:08", "remaining_time": "3:25:50"}
|
| 928 |
+
{"current_steps": 685, "total_steps": 1215, "loss": 0.3285, "lr": 1.905184173265179e-05, "epoch": 2.816032887975334, "percentage": 56.38, "elapsed_time": "4:25:32", "remaining_time": "3:25:27"}
|
| 929 |
+
{"current_steps": 686, "total_steps": 1215, "loss": 0.3315, "lr": 1.89944246800724e-05, "epoch": 2.8201438848920866, "percentage": 56.46, "elapsed_time": "4:25:54", "remaining_time": "3:25:02"}
|
| 930 |
+
{"current_steps": 687, "total_steps": 1215, "loss": 0.343, "lr": 1.8937015935057637e-05, "epoch": 2.8242548818088387, "percentage": 56.54, "elapsed_time": "4:26:17", "remaining_time": "3:24:39"}
|
| 931 |
+
{"current_steps": 688, "total_steps": 1215, "loss": 0.3361, "lr": 1.887961597189008e-05, "epoch": 2.8283658787255908, "percentage": 56.63, "elapsed_time": "4:26:39", "remaining_time": "3:24:15"}
|
| 932 |
+
{"current_steps": 689, "total_steps": 1215, "loss": 0.336, "lr": 1.8822225264779757e-05, "epoch": 2.8324768756423433, "percentage": 56.71, "elapsed_time": "4:27:02", "remaining_time": "3:23:51"}
|
| 933 |
+
{"current_steps": 690, "total_steps": 1215, "loss": 0.3155, "lr": 1.8764844287860235e-05, "epoch": 2.836587872559096, "percentage": 56.79, "elapsed_time": "4:27:24", "remaining_time": "3:23:27"}
|
| 934 |
+
{"current_steps": 691, "total_steps": 1215, "loss": 0.3347, "lr": 1.8707473515184686e-05, "epoch": 2.840698869475848, "percentage": 56.87, "elapsed_time": "4:27:47", "remaining_time": "3:23:04"}
|
| 935 |
+
{"current_steps": 692, "total_steps": 1215, "loss": 0.3261, "lr": 1.8650113420721985e-05, "epoch": 2.8448098663926, "percentage": 56.95, "elapsed_time": "4:28:11", "remaining_time": "3:22:41"}
|
| 936 |
+
{"current_steps": 693, "total_steps": 1215, "loss": 0.3269, "lr": 1.8592764478352788e-05, "epoch": 2.8489208633093526, "percentage": 57.04, "elapsed_time": "4:28:34", "remaining_time": "3:22:18"}
|
| 937 |
+
{"current_steps": 694, "total_steps": 1215, "loss": 0.3273, "lr": 1.8535427161865617e-05, "epoch": 2.8530318602261047, "percentage": 57.12, "elapsed_time": "4:28:57", "remaining_time": "3:21:54"}
|
| 938 |
+
{"current_steps": 695, "total_steps": 1215, "loss": 0.3336, "lr": 1.8478101944952946e-05, "epoch": 2.857142857142857, "percentage": 57.2, "elapsed_time": "4:29:21", "remaining_time": "3:21:31"}
|
| 939 |
+
{"current_steps": 696, "total_steps": 1215, "loss": 0.3285, "lr": 1.842078930120729e-05, "epoch": 2.8612538540596093, "percentage": 57.28, "elapsed_time": "4:29:45", "remaining_time": "3:21:09"}
|
| 940 |
+
{"current_steps": 697, "total_steps": 1215, "loss": 0.3415, "lr": 1.836348970411729e-05, "epoch": 2.865364850976362, "percentage": 57.37, "elapsed_time": "4:30:08", "remaining_time": "3:20:45"}
|
| 941 |
+
{"current_steps": 698, "total_steps": 1215, "loss": 0.3324, "lr": 1.8306203627063803e-05, "epoch": 2.869475847893114, "percentage": 57.45, "elapsed_time": "4:30:31", "remaining_time": "3:20:22"}
|
| 942 |
+
{"current_steps": 699, "total_steps": 1215, "loss": 0.3327, "lr": 1.8248931543315974e-05, "epoch": 2.8735868448098665, "percentage": 57.53, "elapsed_time": "4:30:54", "remaining_time": "3:19:59"}
|
| 943 |
+
{"current_steps": 700, "total_steps": 1215, "loss": 0.336, "lr": 1.8191673926027386e-05, "epoch": 2.8776978417266186, "percentage": 57.61, "elapsed_time": "4:31:17", "remaining_time": "3:19:35"}
|
| 944 |
+
{"current_steps": 701, "total_steps": 1215, "loss": 0.3366, "lr": 1.813443124823206e-05, "epoch": 2.881808838643371, "percentage": 57.7, "elapsed_time": "4:31:39", "remaining_time": "3:19:11"}
|
| 945 |
+
{"current_steps": 702, "total_steps": 1215, "loss": 0.3279, "lr": 1.807720398284062e-05, "epoch": 2.885919835560123, "percentage": 57.78, "elapsed_time": "4:32:02", "remaining_time": "3:18:48"}
|
| 946 |
+
{"current_steps": 703, "total_steps": 1215, "loss": 0.3337, "lr": 1.801999260263635e-05, "epoch": 2.8900308324768758, "percentage": 57.86, "elapsed_time": "4:32:26", "remaining_time": "3:18:25"}
|
| 947 |
+
{"current_steps": 704, "total_steps": 1215, "loss": 0.3244, "lr": 1.7962797580271303e-05, "epoch": 2.894141829393628, "percentage": 57.94, "elapsed_time": "4:32:49", "remaining_time": "3:18:01"}
|
| 948 |
+
{"current_steps": 705, "total_steps": 1215, "loss": 0.3341, "lr": 1.790561938826239e-05, "epoch": 2.8982528263103804, "percentage": 58.02, "elapsed_time": "4:33:13", "remaining_time": "3:17:38"}
|
| 949 |
+
{"current_steps": 706, "total_steps": 1215, "loss": 0.3177, "lr": 1.784845849898748e-05, "epoch": 2.9023638232271325, "percentage": 58.11, "elapsed_time": "4:33:35", "remaining_time": "3:17:14"}
|
| 950 |
+
{"current_steps": 707, "total_steps": 1215, "loss": 0.3199, "lr": 1.7791315384681488e-05, "epoch": 2.906474820143885, "percentage": 58.19, "elapsed_time": "4:33:58", "remaining_time": "3:16:51"}
|
| 951 |
+
{"current_steps": 708, "total_steps": 1215, "loss": 0.3276, "lr": 1.7734190517432498e-05, "epoch": 2.910585817060637, "percentage": 58.27, "elapsed_time": "4:34:22", "remaining_time": "3:16:28"}
|
| 952 |
+
{"current_steps": 709, "total_steps": 1215, "loss": 0.3252, "lr": 1.7677084369177823e-05, "epoch": 2.9146968139773897, "percentage": 58.35, "elapsed_time": "4:34:46", "remaining_time": "3:16:05"}
|
| 953 |
+
{"current_steps": 710, "total_steps": 1215, "loss": 0.3269, "lr": 1.7619997411700146e-05, "epoch": 2.9188078108941418, "percentage": 58.44, "elapsed_time": "4:35:08", "remaining_time": "3:15:41"}
|
| 954 |
+
{"current_steps": 711, "total_steps": 1215, "loss": 0.3221, "lr": 1.7562930116623602e-05, "epoch": 2.9229188078108943, "percentage": 58.52, "elapsed_time": "4:35:32", "remaining_time": "3:15:19"}
|
| 955 |
+
{"current_steps": 712, "total_steps": 1215, "loss": 0.3265, "lr": 1.750588295540988e-05, "epoch": 2.9270298047276464, "percentage": 58.6, "elapsed_time": "4:35:56", "remaining_time": "3:14:56"}
|
| 956 |
+
{"current_steps": 713, "total_steps": 1215, "loss": 0.331, "lr": 1.7448856399354335e-05, "epoch": 2.931140801644399, "percentage": 58.68, "elapsed_time": "4:36:19", "remaining_time": "3:14:33"}
|
| 957 |
+
{"current_steps": 714, "total_steps": 1215, "loss": 0.3133, "lr": 1.7391850919582097e-05, "epoch": 2.935251798561151, "percentage": 58.77, "elapsed_time": "4:36:43", "remaining_time": "3:14:10"}
|
| 958 |
+
{"current_steps": 715, "total_steps": 1215, "loss": 0.3345, "lr": 1.733486698704417e-05, "epoch": 2.939362795477903, "percentage": 58.85, "elapsed_time": "4:37:06", "remaining_time": "3:13:46"}
|
| 959 |
+
{"current_steps": 716, "total_steps": 1215, "loss": 0.3125, "lr": 1.7277905072513538e-05, "epoch": 2.9434737923946557, "percentage": 58.93, "elapsed_time": "4:37:29", "remaining_time": "3:13:23"}
|
| 960 |
+
{"current_steps": 717, "total_steps": 1215, "loss": 0.3329, "lr": 1.7220965646581304e-05, "epoch": 2.947584789311408, "percentage": 59.01, "elapsed_time": "4:37:52", "remaining_time": "3:13:00"}
|
| 961 |
+
{"current_steps": 718, "total_steps": 1215, "loss": 0.342, "lr": 1.7164049179652762e-05, "epoch": 2.9516957862281603, "percentage": 59.09, "elapsed_time": "4:38:15", "remaining_time": "3:12:36"}
|
| 962 |
+
{"current_steps": 719, "total_steps": 1215, "loss": 0.3317, "lr": 1.7107156141943536e-05, "epoch": 2.9558067831449124, "percentage": 59.18, "elapsed_time": "4:38:38", "remaining_time": "3:12:13"}
|
| 963 |
+
{"current_steps": 720, "total_steps": 1215, "loss": 0.338, "lr": 1.7050287003475684e-05, "epoch": 2.959917780061665, "percentage": 59.26, "elapsed_time": "4:39:01", "remaining_time": "3:11:49"}
|
| 964 |
+
{"current_steps": 721, "total_steps": 1215, "loss": 0.3221, "lr": 1.699344223407384e-05, "epoch": 2.9640287769784175, "percentage": 59.34, "elapsed_time": "4:39:22", "remaining_time": "3:11:25"}
|
| 965 |
+
{"current_steps": 722, "total_steps": 1215, "loss": 0.3272, "lr": 1.6936622303361292e-05, "epoch": 2.9681397738951696, "percentage": 59.42, "elapsed_time": "4:39:46", "remaining_time": "3:11:01"}
|
| 966 |
+
{"current_steps": 723, "total_steps": 1215, "loss": 0.3283, "lr": 1.6879827680756132e-05, "epoch": 2.9722507708119217, "percentage": 59.51, "elapsed_time": "4:40:09", "remaining_time": "3:10:38"}
|
| 967 |
+
{"current_steps": 724, "total_steps": 1215, "loss": 0.3297, "lr": 1.682305883546737e-05, "epoch": 2.9763617677286742, "percentage": 59.59, "elapsed_time": "4:40:32", "remaining_time": "3:10:15"}
|
| 968 |
+
{"current_steps": 725, "total_steps": 1215, "loss": 0.3314, "lr": 1.6766316236491046e-05, "epoch": 2.9804727646454268, "percentage": 59.67, "elapsed_time": "4:40:54", "remaining_time": "3:09:51"}
|
| 969 |
+
{"current_steps": 726, "total_steps": 1215, "loss": 0.3238, "lr": 1.6709600352606382e-05, "epoch": 2.984583761562179, "percentage": 59.75, "elapsed_time": "4:41:16", "remaining_time": "3:09:26"}
|
| 970 |
+
{"current_steps": 727, "total_steps": 1215, "loss": 0.3274, "lr": 1.665291165237188e-05, "epoch": 2.988694758478931, "percentage": 59.84, "elapsed_time": "4:41:39", "remaining_time": "3:09:04"}
|
| 971 |
+
{"current_steps": 728, "total_steps": 1215, "loss": 0.3328, "lr": 1.6596250604121468e-05, "epoch": 2.9928057553956835, "percentage": 59.92, "elapsed_time": "4:42:02", "remaining_time": "3:08:40"}
|
| 972 |
+
{"current_steps": 729, "total_steps": 1215, "loss": 0.3335, "lr": 1.653961767596063e-05, "epoch": 2.996916752312436, "percentage": 60.0, "elapsed_time": "4:42:26", "remaining_time": "3:08:17"}
|
| 973 |
+
{"current_steps": 730, "total_steps": 1215, "loss": 0.2946, "lr": 1.6483013335762536e-05, "epoch": 3.001027749229188, "percentage": 60.08, "elapsed_time": "4:44:31", "remaining_time": "3:09:02"}
|
| 974 |
+
{"current_steps": 731, "total_steps": 1215, "loss": 0.2781, "lr": 1.6426438051164168e-05, "epoch": 3.0051387461459402, "percentage": 60.16, "elapsed_time": "4:44:55", "remaining_time": "3:08:39"}
|
| 975 |
+
{"current_steps": 732, "total_steps": 1215, "loss": 0.2843, "lr": 1.636989228956248e-05, "epoch": 3.0092497430626928, "percentage": 60.25, "elapsed_time": "4:45:19", "remaining_time": "3:08:15"}
|
| 976 |
+
{"current_steps": 733, "total_steps": 1215, "loss": 0.2747, "lr": 1.631337651811051e-05, "epoch": 3.013360739979445, "percentage": 60.33, "elapsed_time": "4:45:42", "remaining_time": "3:07:52"}
|
| 977 |
+
{"current_steps": 734, "total_steps": 1215, "loss": 0.2728, "lr": 1.6256891203713533e-05, "epoch": 3.0174717368961974, "percentage": 60.41, "elapsed_time": "4:46:03", "remaining_time": "3:07:27"}
|
| 978 |
+
{"current_steps": 735, "total_steps": 1215, "loss": 0.2736, "lr": 1.6200436813025208e-05, "epoch": 3.0215827338129495, "percentage": 60.49, "elapsed_time": "4:46:25", "remaining_time": "3:07:03"}
|
| 979 |
+
{"current_steps": 736, "total_steps": 1215, "loss": 0.288, "lr": 1.6144013812443712e-05, "epoch": 3.025693730729702, "percentage": 60.58, "elapsed_time": "4:46:47", "remaining_time": "3:06:38"}
|
| 980 |
+
{"current_steps": 737, "total_steps": 1215, "loss": 0.2675, "lr": 1.60876226681079e-05, "epoch": 3.029804727646454, "percentage": 60.66, "elapsed_time": "4:47:10", "remaining_time": "3:06:15"}
|
| 981 |
+
{"current_steps": 738, "total_steps": 1215, "loss": 0.2696, "lr": 1.6031263845893436e-05, "epoch": 3.0339157245632067, "percentage": 60.74, "elapsed_time": "4:47:34", "remaining_time": "3:05:52"}
|
| 982 |
+
{"current_steps": 739, "total_steps": 1215, "loss": 0.2806, "lr": 1.5974937811408964e-05, "epoch": 3.038026721479959, "percentage": 60.82, "elapsed_time": "4:47:57", "remaining_time": "3:05:28"}
|
| 983 |
+
{"current_steps": 740, "total_steps": 1215, "loss": 0.2669, "lr": 1.5918645029992237e-05, "epoch": 3.0421377183967113, "percentage": 60.91, "elapsed_time": "4:48:19", "remaining_time": "3:05:04"}
|
| 984 |
+
{"current_steps": 741, "total_steps": 1215, "loss": 0.2827, "lr": 1.5862385966706324e-05, "epoch": 3.0462487153134634, "percentage": 60.99, "elapsed_time": "4:48:43", "remaining_time": "3:04:41"}
|
| 985 |
+
{"current_steps": 742, "total_steps": 1215, "loss": 0.2772, "lr": 1.580616108633569e-05, "epoch": 3.050359712230216, "percentage": 61.07, "elapsed_time": "4:49:06", "remaining_time": "3:04:17"}
|
| 986 |
+
{"current_steps": 743, "total_steps": 1215, "loss": 0.2813, "lr": 1.5749970853382416e-05, "epoch": 3.054470709146968, "percentage": 61.15, "elapsed_time": "4:49:29", "remaining_time": "3:03:54"}
|
| 987 |
+
{"current_steps": 744, "total_steps": 1215, "loss": 0.2786, "lr": 1.5693815732062346e-05, "epoch": 3.0585817060637206, "percentage": 61.23, "elapsed_time": "4:49:51", "remaining_time": "3:03:30"}
|
| 988 |
+
{"current_steps": 745, "total_steps": 1215, "loss": 0.2781, "lr": 1.563769618630124e-05, "epoch": 3.0626927029804727, "percentage": 61.32, "elapsed_time": "4:50:15", "remaining_time": "3:03:06"}
|
| 989 |
+
{"current_steps": 746, "total_steps": 1215, "loss": 0.2811, "lr": 1.558161267973096e-05, "epoch": 3.0668036998972252, "percentage": 61.4, "elapsed_time": "4:50:39", "remaining_time": "3:02:43"}
|
| 990 |
+
{"current_steps": 747, "total_steps": 1215, "loss": 0.2731, "lr": 1.552556567568562e-05, "epoch": 3.0709146968139773, "percentage": 61.48, "elapsed_time": "4:51:01", "remaining_time": "3:02:19"}
|
| 991 |
+
{"current_steps": 748, "total_steps": 1215, "loss": 0.273, "lr": 1.5469555637197775e-05, "epoch": 3.07502569373073, "percentage": 61.56, "elapsed_time": "4:51:24", "remaining_time": "3:01:56"}
|
| 992 |
+
{"current_steps": 749, "total_steps": 1215, "loss": 0.2737, "lr": 1.541358302699459e-05, "epoch": 3.079136690647482, "percentage": 61.65, "elapsed_time": "4:51:47", "remaining_time": "3:01:32"}
|
| 993 |
+
{"current_steps": 750, "total_steps": 1215, "loss": 0.2719, "lr": 1.535764830749401e-05, "epoch": 3.0832476875642345, "percentage": 61.73, "elapsed_time": "4:52:10", "remaining_time": "3:01:09"}
|
| 994 |
+
{"current_steps": 751, "total_steps": 1215, "loss": 0.2702, "lr": 1.5301751940800947e-05, "epoch": 3.0873586844809866, "percentage": 61.81, "elapsed_time": "4:52:32", "remaining_time": "3:00:44"}
|
| 995 |
+
{"current_steps": 752, "total_steps": 1215, "loss": 0.2746, "lr": 1.5245894388703473e-05, "epoch": 3.091469681397739, "percentage": 61.89, "elapsed_time": "4:52:55", "remaining_time": "3:00:21"}
|
| 996 |
+
{"current_steps": 753, "total_steps": 1215, "loss": 0.2741, "lr": 1.5190076112668975e-05, "epoch": 3.0955806783144912, "percentage": 61.98, "elapsed_time": "4:53:19", "remaining_time": "2:59:58"}
|
| 997 |
+
{"current_steps": 754, "total_steps": 1215, "loss": 0.2609, "lr": 1.5134297573840373e-05, "epoch": 3.099691675231244, "percentage": 62.06, "elapsed_time": "4:53:42", "remaining_time": "2:59:34"}
|
| 998 |
+
{"current_steps": 755, "total_steps": 1215, "loss": 0.2683, "lr": 1.507855923303229e-05, "epoch": 3.103802672147996, "percentage": 62.14, "elapsed_time": "4:54:04", "remaining_time": "2:59:10"}
|
| 999 |
+
{"current_steps": 756, "total_steps": 1215, "loss": 0.2753, "lr": 1.5022861550727261e-05, "epoch": 3.1079136690647484, "percentage": 62.22, "elapsed_time": "4:54:26", "remaining_time": "2:58:46"}
|
| 1000 |
+
{"current_steps": 757, "total_steps": 1215, "loss": 0.2674, "lr": 1.4967204987071916e-05, "epoch": 3.1120246659815005, "percentage": 62.3, "elapsed_time": "4:54:49", "remaining_time": "2:58:22"}
|
| 1001 |
+
{"current_steps": 758, "total_steps": 1215, "loss": 0.2766, "lr": 1.491159000187318e-05, "epoch": 3.1161356628982526, "percentage": 62.39, "elapsed_time": "4:55:13", "remaining_time": "2:57:59"}
|
| 1002 |
+
{"current_steps": 759, "total_steps": 1215, "loss": 0.2817, "lr": 1.4856017054594487e-05, "epoch": 3.120246659815005, "percentage": 62.47, "elapsed_time": "4:55:35", "remaining_time": "2:57:35"}
|
| 1003 |
+
{"current_steps": 760, "total_steps": 1215, "loss": 0.2692, "lr": 1.4800486604351953e-05, "epoch": 3.1243576567317572, "percentage": 62.55, "elapsed_time": "4:55:58", "remaining_time": "2:57:11"}
|
| 1004 |
+
{"current_steps": 761, "total_steps": 1215, "loss": 0.2881, "lr": 1.4744999109910642e-05, "epoch": 3.12846865364851, "percentage": 62.63, "elapsed_time": "4:56:21", "remaining_time": "2:56:48"}
|
| 1005 |
+
{"current_steps": 762, "total_steps": 1215, "loss": 0.2811, "lr": 1.4689555029680706e-05, "epoch": 3.132579650565262, "percentage": 62.72, "elapsed_time": "4:56:43", "remaining_time": "2:56:24"}
|
| 1006 |
+
{"current_steps": 763, "total_steps": 1215, "loss": 0.2748, "lr": 1.4634154821713642e-05, "epoch": 3.1366906474820144, "percentage": 62.8, "elapsed_time": "4:57:06", "remaining_time": "2:56:00"}
|
| 1007 |
+
{"current_steps": 764, "total_steps": 1215, "loss": 0.2775, "lr": 1.4578798943698495e-05, "epoch": 3.1408016443987665, "percentage": 62.88, "elapsed_time": "4:57:29", "remaining_time": "2:55:36"}
|
| 1008 |
+
{"current_steps": 765, "total_steps": 1215, "loss": 0.274, "lr": 1.4523487852958078e-05, "epoch": 3.144912641315519, "percentage": 62.96, "elapsed_time": "4:57:52", "remaining_time": "2:55:13"}
|
| 1009 |
+
{"current_steps": 766, "total_steps": 1215, "loss": 0.2846, "lr": 1.4468222006445194e-05, "epoch": 3.149023638232271, "percentage": 63.05, "elapsed_time": "4:58:16", "remaining_time": "2:54:50"}
|
| 1010 |
+
{"current_steps": 767, "total_steps": 1215, "loss": 0.2751, "lr": 1.4413001860738857e-05, "epoch": 3.1531346351490237, "percentage": 63.13, "elapsed_time": "4:58:39", "remaining_time": "2:54:26"}
|
| 1011 |
+
{"current_steps": 768, "total_steps": 1215, "loss": 0.2763, "lr": 1.4357827872040533e-05, "epoch": 3.157245632065776, "percentage": 63.21, "elapsed_time": "4:59:02", "remaining_time": "2:54:03"}
|
| 1012 |
+
{"current_steps": 769, "total_steps": 1215, "loss": 0.273, "lr": 1.4302700496170348e-05, "epoch": 3.1613566289825283, "percentage": 63.29, "elapsed_time": "4:59:25", "remaining_time": "2:53:39"}
|
| 1013 |
+
{"current_steps": 770, "total_steps": 1215, "loss": 0.2733, "lr": 1.424762018856335e-05, "epoch": 3.1654676258992804, "percentage": 63.37, "elapsed_time": "4:59:47", "remaining_time": "2:53:15"}
|
| 1014 |
+
{"current_steps": 771, "total_steps": 1215, "loss": 0.2739, "lr": 1.4192587404265723e-05, "epoch": 3.169578622816033, "percentage": 63.46, "elapsed_time": "5:00:10", "remaining_time": "2:52:51"}
|
| 1015 |
+
{"current_steps": 772, "total_steps": 1215, "loss": 0.2819, "lr": 1.4137602597931039e-05, "epoch": 3.173689619732785, "percentage": 63.54, "elapsed_time": "5:00:34", "remaining_time": "2:52:28"}
|
| 1016 |
+
{"current_steps": 773, "total_steps": 1215, "loss": 0.2792, "lr": 1.4082666223816503e-05, "epoch": 3.1778006166495376, "percentage": 63.62, "elapsed_time": "5:00:56", "remaining_time": "2:52:04"}
|
| 1017 |
+
{"current_steps": 774, "total_steps": 1215, "loss": 0.2777, "lr": 1.4027778735779194e-05, "epoch": 3.1819116135662897, "percentage": 63.7, "elapsed_time": "5:01:20", "remaining_time": "2:51:41"}
|
| 1018 |
+
{"current_steps": 775, "total_steps": 1215, "loss": 0.2765, "lr": 1.397294058727232e-05, "epoch": 3.1860226104830422, "percentage": 63.79, "elapsed_time": "5:01:42", "remaining_time": "2:51:17"}
|
| 1019 |
+
{"current_steps": 776, "total_steps": 1215, "loss": 0.2859, "lr": 1.3918152231341466e-05, "epoch": 3.1901336073997943, "percentage": 63.87, "elapsed_time": "5:02:06", "remaining_time": "2:50:54"}
|
| 1020 |
+
{"current_steps": 777, "total_steps": 1215, "loss": 0.2739, "lr": 1.3863414120620866e-05, "epoch": 3.194244604316547, "percentage": 63.95, "elapsed_time": "5:02:29", "remaining_time": "2:50:30"}
|
| 1021 |
+
{"current_steps": 778, "total_steps": 1215, "loss": 0.2854, "lr": 1.3808726707329636e-05, "epoch": 3.198355601233299, "percentage": 64.03, "elapsed_time": "5:02:53", "remaining_time": "2:50:07"}
|
| 1022 |
+
{"current_steps": 779, "total_steps": 1215, "loss": 0.2739, "lr": 1.3754090443268073e-05, "epoch": 3.2024665981500515, "percentage": 64.12, "elapsed_time": "5:03:15", "remaining_time": "2:49:44"}
|
| 1023 |
+
{"current_steps": 780, "total_steps": 1215, "loss": 0.2779, "lr": 1.3699505779813885e-05, "epoch": 3.2065775950668036, "percentage": 64.2, "elapsed_time": "5:03:38", "remaining_time": "2:49:20"}
|
| 1024 |
+
{"current_steps": 781, "total_steps": 1215, "loss": 0.2819, "lr": 1.3644973167918509e-05, "epoch": 3.210688591983556, "percentage": 64.28, "elapsed_time": "5:04:02", "remaining_time": "2:48:57"}
|
| 1025 |
+
{"current_steps": 782, "total_steps": 1215, "loss": 0.2912, "lr": 1.3590493058103334e-05, "epoch": 3.2147995889003083, "percentage": 64.36, "elapsed_time": "5:04:24", "remaining_time": "2:48:33"}
|
| 1026 |
+
{"current_steps": 783, "total_steps": 1215, "loss": 0.2625, "lr": 1.353606590045601e-05, "epoch": 3.218910585817061, "percentage": 64.44, "elapsed_time": "5:04:48", "remaining_time": "2:48:10"}
|
| 1027 |
+
{"current_steps": 784, "total_steps": 1215, "loss": 0.2716, "lr": 1.3481692144626723e-05, "epoch": 3.223021582733813, "percentage": 64.53, "elapsed_time": "5:05:11", "remaining_time": "2:47:46"}
|
| 1028 |
+
{"current_steps": 785, "total_steps": 1215, "loss": 0.2833, "lr": 1.3427372239824478e-05, "epoch": 3.2271325796505654, "percentage": 64.61, "elapsed_time": "5:05:34", "remaining_time": "2:47:23"}
|
| 1029 |
+
{"current_steps": 786, "total_steps": 1215, "loss": 0.2815, "lr": 1.3373106634813395e-05, "epoch": 3.2312435765673175, "percentage": 64.69, "elapsed_time": "5:05:57", "remaining_time": "2:46:59"}
|
| 1030 |
+
{"current_steps": 787, "total_steps": 1215, "loss": 0.2737, "lr": 1.3318895777908989e-05, "epoch": 3.23535457348407, "percentage": 64.77, "elapsed_time": "5:06:20", "remaining_time": "2:46:35"}
|