Training in progress, epoch 3
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1cd705d43bf2ee195f6da60111faed90743ebac4c04f149598429abe9e39e4f9
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fe071e3a4141e03a8b80672bfa60da43ca008145d34291daf61c0add4c059f42
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8d5012e7deb44193dda31bc4fdfea1bbb030ad14b9d44c8b1580d96723dc85dc
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8b91b1c156683bf598c38137c0d098276e568097ee68a560b9aa59e3deb387a1
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -858,3 +858,249 @@
|
|
| 858 |
{"current_steps": 743, "total_steps": 1230, "loss": 0.2682, "lr": 1.624791353909428e-05, "epoch": 3.016708860759494, "percentage": 60.41, "elapsed_time": "2:16:42", "remaining_time": "1:29:36"}
|
| 859 |
{"current_steps": 744, "total_steps": 1230, "loss": 0.2685, "lr": 1.619217781670663e-05, "epoch": 3.020759493670886, "percentage": 60.49, "elapsed_time": "2:17:13", "remaining_time": "1:29:38"}
|
| 860 |
{"current_steps": 745, "total_steps": 1230, "loss": 0.2529, "lr": 1.6136472761995373e-05, "epoch": 3.0248101265822784, "percentage": 60.57, "elapsed_time": "2:17:42", "remaining_time": "1:29:38"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 858 |
{"current_steps": 743, "total_steps": 1230, "loss": 0.2682, "lr": 1.624791353909428e-05, "epoch": 3.016708860759494, "percentage": 60.41, "elapsed_time": "2:16:42", "remaining_time": "1:29:36"}
|
| 859 |
{"current_steps": 744, "total_steps": 1230, "loss": 0.2685, "lr": 1.619217781670663e-05, "epoch": 3.020759493670886, "percentage": 60.49, "elapsed_time": "2:17:13", "remaining_time": "1:29:38"}
|
| 860 |
{"current_steps": 745, "total_steps": 1230, "loss": 0.2529, "lr": 1.6136472761995373e-05, "epoch": 3.0248101265822784, "percentage": 60.57, "elapsed_time": "2:17:42", "remaining_time": "1:29:38"}
|
| 861 |
+
{"current_steps": 746, "total_steps": 1230, "loss": 0.2782, "lr": 1.608079882360134e-05, "epoch": 3.028860759493671, "percentage": 60.65, "elapsed_time": "2:18:14", "remaining_time": "1:29:41"}
|
| 862 |
+
{"current_steps": 747, "total_steps": 1230, "loss": 0.2682, "lr": 1.60251564499148e-05, "epoch": 3.0329113924050635, "percentage": 60.73, "elapsed_time": "2:18:46", "remaining_time": "1:29:43"}
|
| 863 |
+
{"current_steps": 748, "total_steps": 1230, "loss": 0.2738, "lr": 1.596954608907176e-05, "epoch": 3.0369620253164555, "percentage": 60.81, "elapsed_time": "2:19:22", "remaining_time": "1:29:48"}
|
| 864 |
+
{"current_steps": 749, "total_steps": 1230, "loss": 0.2675, "lr": 1.591396818895043e-05, "epoch": 3.041012658227848, "percentage": 60.89, "elapsed_time": "2:19:49", "remaining_time": "1:29:47"}
|
| 865 |
+
{"current_steps": 750, "total_steps": 1230, "loss": 0.2831, "lr": 1.585842319716759e-05, "epoch": 3.0450632911392406, "percentage": 60.98, "elapsed_time": "2:20:25", "remaining_time": "1:29:52"}
|
| 866 |
+
{"current_steps": 751, "total_steps": 1230, "loss": 0.2559, "lr": 1.5802911561074944e-05, "epoch": 3.049113924050633, "percentage": 61.06, "elapsed_time": "2:20:52", "remaining_time": "1:29:51"}
|
| 867 |
+
{"current_steps": 752, "total_steps": 1230, "loss": 0.2686, "lr": 1.5747433727755595e-05, "epoch": 3.053164556962025, "percentage": 61.14, "elapsed_time": "2:21:25", "remaining_time": "1:29:53"}
|
| 868 |
+
{"current_steps": 753, "total_steps": 1230, "loss": 0.2754, "lr": 1.5691990144020376e-05, "epoch": 3.0572151898734177, "percentage": 61.22, "elapsed_time": "2:21:53", "remaining_time": "1:29:52"}
|
| 869 |
+
{"current_steps": 754, "total_steps": 1230, "loss": 0.2741, "lr": 1.5636581256404297e-05, "epoch": 3.06126582278481, "percentage": 61.3, "elapsed_time": "2:22:23", "remaining_time": "1:29:53"}
|
| 870 |
+
{"current_steps": 755, "total_steps": 1230, "loss": 0.2636, "lr": 1.558120751116291e-05, "epoch": 3.0653164556962027, "percentage": 61.38, "elapsed_time": "2:22:50", "remaining_time": "1:29:51"}
|
| 871 |
+
{"current_steps": 756, "total_steps": 1230, "loss": 0.2629, "lr": 1.552586935426876e-05, "epoch": 3.0693670886075948, "percentage": 61.46, "elapsed_time": "2:23:21", "remaining_time": "1:29:53"}
|
| 872 |
+
{"current_steps": 757, "total_steps": 1230, "loss": 0.2488, "lr": 1.547056723140774e-05, "epoch": 3.0734177215189873, "percentage": 61.54, "elapsed_time": "2:23:47", "remaining_time": "1:29:50"}
|
| 873 |
+
{"current_steps": 758, "total_steps": 1230, "loss": 0.2667, "lr": 1.5415301587975565e-05, "epoch": 3.07746835443038, "percentage": 61.63, "elapsed_time": "2:24:24", "remaining_time": "1:29:55"}
|
| 874 |
+
{"current_steps": 759, "total_steps": 1230, "loss": 0.2429, "lr": 1.536007286907411e-05, "epoch": 3.0815189873417723, "percentage": 61.71, "elapsed_time": "2:24:55", "remaining_time": "1:29:55"}
|
| 875 |
+
{"current_steps": 760, "total_steps": 1230, "loss": 0.2908, "lr": 1.5304881519507896e-05, "epoch": 3.0855696202531644, "percentage": 61.79, "elapsed_time": "2:25:31", "remaining_time": "1:29:59"}
|
| 876 |
+
{"current_steps": 761, "total_steps": 1230, "loss": 0.2667, "lr": 1.5249727983780453e-05, "epoch": 3.089620253164557, "percentage": 61.87, "elapsed_time": "2:26:07", "remaining_time": "1:30:03"}
|
| 877 |
+
{"current_steps": 762, "total_steps": 1230, "loss": 0.243, "lr": 1.5194612706090786e-05, "epoch": 3.0936708860759494, "percentage": 61.95, "elapsed_time": "2:26:40", "remaining_time": "1:30:04"}
|
| 878 |
+
{"current_steps": 763, "total_steps": 1230, "loss": 0.2569, "lr": 1.5139536130329771e-05, "epoch": 3.097721518987342, "percentage": 62.03, "elapsed_time": "2:27:11", "remaining_time": "1:30:05"}
|
| 879 |
+
{"current_steps": 764, "total_steps": 1230, "loss": 0.2606, "lr": 1.508449870007656e-05, "epoch": 3.101772151898734, "percentage": 62.11, "elapsed_time": "2:27:41", "remaining_time": "1:30:04"}
|
| 880 |
+
{"current_steps": 765, "total_steps": 1230, "loss": 0.2398, "lr": 1.5029500858595056e-05, "epoch": 3.1058227848101265, "percentage": 62.2, "elapsed_time": "2:28:09", "remaining_time": "1:30:03"}
|
| 881 |
+
{"current_steps": 766, "total_steps": 1230, "loss": 0.243, "lr": 1.4974543048830328e-05, "epoch": 3.109873417721519, "percentage": 62.28, "elapsed_time": "2:28:40", "remaining_time": "1:30:03"}
|
| 882 |
+
{"current_steps": 767, "total_steps": 1230, "loss": 0.2768, "lr": 1.4919625713405e-05, "epoch": 3.1139240506329116, "percentage": 62.36, "elapsed_time": "2:29:15", "remaining_time": "1:30:06"}
|
| 883 |
+
{"current_steps": 768, "total_steps": 1230, "loss": 0.2924, "lr": 1.4864749294615756e-05, "epoch": 3.1179746835443036, "percentage": 62.44, "elapsed_time": "2:29:44", "remaining_time": "1:30:04"}
|
| 884 |
+
{"current_steps": 769, "total_steps": 1230, "loss": 0.2803, "lr": 1.4809914234429716e-05, "epoch": 3.122025316455696, "percentage": 62.52, "elapsed_time": "2:30:21", "remaining_time": "1:30:08"}
|
| 885 |
+
{"current_steps": 770, "total_steps": 1230, "loss": 0.2486, "lr": 1.4755120974480923e-05, "epoch": 3.1260759493670887, "percentage": 62.6, "elapsed_time": "2:30:51", "remaining_time": "1:30:07"}
|
| 886 |
+
{"current_steps": 771, "total_steps": 1230, "loss": 0.2661, "lr": 1.4700369956066771e-05, "epoch": 3.130126582278481, "percentage": 62.68, "elapsed_time": "2:31:23", "remaining_time": "1:30:07"}
|
| 887 |
+
{"current_steps": 772, "total_steps": 1230, "loss": 0.2514, "lr": 1.4645661620144413e-05, "epoch": 3.1341772151898732, "percentage": 62.76, "elapsed_time": "2:31:56", "remaining_time": "1:30:08"}
|
| 888 |
+
{"current_steps": 773, "total_steps": 1230, "loss": 0.264, "lr": 1.4590996407327284e-05, "epoch": 3.1382278481012658, "percentage": 62.85, "elapsed_time": "2:32:32", "remaining_time": "1:30:10"}
|
| 889 |
+
{"current_steps": 774, "total_steps": 1230, "loss": 0.268, "lr": 1.4536374757881487e-05, "epoch": 3.1422784810126583, "percentage": 62.93, "elapsed_time": "2:33:01", "remaining_time": "1:30:09"}
|
| 890 |
+
{"current_steps": 775, "total_steps": 1230, "loss": 0.2396, "lr": 1.4481797111722271e-05, "epoch": 3.146329113924051, "percentage": 63.01, "elapsed_time": "2:33:30", "remaining_time": "1:30:07"}
|
| 891 |
+
{"current_steps": 776, "total_steps": 1230, "loss": 0.2618, "lr": 1.4427263908410507e-05, "epoch": 3.150379746835443, "percentage": 63.09, "elapsed_time": "2:34:06", "remaining_time": "1:30:09"}
|
| 892 |
+
{"current_steps": 777, "total_steps": 1230, "loss": 0.2534, "lr": 1.4372775587149108e-05, "epoch": 3.1544303797468354, "percentage": 63.17, "elapsed_time": "2:34:43", "remaining_time": "1:30:12"}
|
| 893 |
+
{"current_steps": 778, "total_steps": 1230, "loss": 0.271, "lr": 1.4318332586779522e-05, "epoch": 3.158481012658228, "percentage": 63.25, "elapsed_time": "2:35:16", "remaining_time": "1:30:12"}
|
| 894 |
+
{"current_steps": 779, "total_steps": 1230, "loss": 0.2699, "lr": 1.4263935345778202e-05, "epoch": 3.1625316455696204, "percentage": 63.33, "elapsed_time": "2:35:44", "remaining_time": "1:30:09"}
|
| 895 |
+
{"current_steps": 780, "total_steps": 1230, "loss": 0.2474, "lr": 1.420958430225303e-05, "epoch": 3.1665822784810125, "percentage": 63.41, "elapsed_time": "2:36:15", "remaining_time": "1:30:08"}
|
| 896 |
+
{"current_steps": 781, "total_steps": 1230, "loss": 0.2655, "lr": 1.415527989393985e-05, "epoch": 3.170632911392405, "percentage": 63.5, "elapsed_time": "2:36:47", "remaining_time": "1:30:08"}
|
| 897 |
+
{"current_steps": 782, "total_steps": 1230, "loss": 0.2795, "lr": 1.410102255819891e-05, "epoch": 3.1746835443037975, "percentage": 63.58, "elapsed_time": "2:37:16", "remaining_time": "1:30:06"}
|
| 898 |
+
{"current_steps": 783, "total_steps": 1230, "loss": 0.2676, "lr": 1.404681273201131e-05, "epoch": 3.17873417721519, "percentage": 63.66, "elapsed_time": "2:37:50", "remaining_time": "1:30:06"}
|
| 899 |
+
{"current_steps": 784, "total_steps": 1230, "loss": 0.2635, "lr": 1.399265085197556e-05, "epoch": 3.182784810126582, "percentage": 63.74, "elapsed_time": "2:38:22", "remaining_time": "1:30:05"}
|
| 900 |
+
{"current_steps": 785, "total_steps": 1230, "loss": 0.2585, "lr": 1.393853735430398e-05, "epoch": 3.1868354430379746, "percentage": 63.82, "elapsed_time": "2:38:54", "remaining_time": "1:30:04"}
|
| 901 |
+
{"current_steps": 786, "total_steps": 1230, "loss": 0.267, "lr": 1.3884472674819246e-05, "epoch": 3.190886075949367, "percentage": 63.9, "elapsed_time": "2:39:24", "remaining_time": "1:30:02"}
|
| 902 |
+
{"current_steps": 787, "total_steps": 1230, "loss": 0.2739, "lr": 1.3830457248950864e-05, "epoch": 3.1949367088607596, "percentage": 63.98, "elapsed_time": "2:39:55", "remaining_time": "1:30:01"}
|
| 903 |
+
{"current_steps": 788, "total_steps": 1230, "loss": 0.2553, "lr": 1.377649151173163e-05, "epoch": 3.1989873417721517, "percentage": 64.07, "elapsed_time": "2:40:30", "remaining_time": "1:30:01"}
|
| 904 |
+
{"current_steps": 789, "total_steps": 1230, "loss": 0.251, "lr": 1.3722575897794181e-05, "epoch": 3.2030379746835442, "percentage": 64.15, "elapsed_time": "2:41:03", "remaining_time": "1:30:01"}
|
| 905 |
+
{"current_steps": 790, "total_steps": 1230, "loss": 0.2641, "lr": 1.3668710841367472e-05, "epoch": 3.2070886075949367, "percentage": 64.23, "elapsed_time": "2:41:36", "remaining_time": "1:30:00"}
|
| 906 |
+
{"current_steps": 791, "total_steps": 1230, "loss": 0.2902, "lr": 1.361489677627324e-05, "epoch": 3.2111392405063293, "percentage": 64.31, "elapsed_time": "2:42:09", "remaining_time": "1:29:59"}
|
| 907 |
+
{"current_steps": 792, "total_steps": 1230, "loss": 0.277, "lr": 1.3561134135922585e-05, "epoch": 3.2151898734177213, "percentage": 64.39, "elapsed_time": "2:42:46", "remaining_time": "1:30:01"}
|
| 908 |
+
{"current_steps": 793, "total_steps": 1230, "loss": 0.2725, "lr": 1.350742335331241e-05, "epoch": 3.219240506329114, "percentage": 64.47, "elapsed_time": "2:43:23", "remaining_time": "1:30:02"}
|
| 909 |
+
{"current_steps": 794, "total_steps": 1230, "loss": 0.259, "lr": 1.345376486102198e-05, "epoch": 3.2232911392405064, "percentage": 64.55, "elapsed_time": "2:43:57", "remaining_time": "1:30:01"}
|
| 910 |
+
{"current_steps": 795, "total_steps": 1230, "loss": 0.2506, "lr": 1.3400159091209414e-05, "epoch": 3.227341772151899, "percentage": 64.63, "elapsed_time": "2:44:27", "remaining_time": "1:29:59"}
|
| 911 |
+
{"current_steps": 796, "total_steps": 1230, "loss": 0.2511, "lr": 1.3346606475608216e-05, "epoch": 3.231392405063291, "percentage": 64.72, "elapsed_time": "2:45:03", "remaining_time": "1:29:59"}
|
| 912 |
+
{"current_steps": 797, "total_steps": 1230, "loss": 0.2521, "lr": 1.3293107445523781e-05, "epoch": 3.2354430379746835, "percentage": 64.8, "elapsed_time": "2:45:36", "remaining_time": "1:29:58"}
|
| 913 |
+
{"current_steps": 798, "total_steps": 1230, "loss": 0.2624, "lr": 1.3239662431829949e-05, "epoch": 3.239493670886076, "percentage": 64.88, "elapsed_time": "2:46:09", "remaining_time": "1:29:56"}
|
| 914 |
+
{"current_steps": 799, "total_steps": 1230, "loss": 0.2509, "lr": 1.3186271864965509e-05, "epoch": 3.2435443037974685, "percentage": 64.96, "elapsed_time": "2:46:41", "remaining_time": "1:29:54"}
|
| 915 |
+
{"current_steps": 800, "total_steps": 1230, "loss": 0.2553, "lr": 1.3132936174930756e-05, "epoch": 3.2475949367088606, "percentage": 65.04, "elapsed_time": "2:47:13", "remaining_time": "1:29:52"}
|
| 916 |
+
{"current_steps": 801, "total_steps": 1230, "loss": 0.2657, "lr": 1.3079655791283995e-05, "epoch": 3.251645569620253, "percentage": 65.12, "elapsed_time": "2:47:45", "remaining_time": "1:29:50"}
|
| 917 |
+
{"current_steps": 802, "total_steps": 1230, "loss": 0.2451, "lr": 1.3026431143138108e-05, "epoch": 3.2556962025316456, "percentage": 65.2, "elapsed_time": "2:48:18", "remaining_time": "1:29:49"}
|
| 918 |
+
{"current_steps": 803, "total_steps": 1230, "loss": 0.2752, "lr": 1.2973262659157114e-05, "epoch": 3.259746835443038, "percentage": 65.28, "elapsed_time": "2:48:52", "remaining_time": "1:29:48"}
|
| 919 |
+
{"current_steps": 804, "total_steps": 1230, "loss": 0.2381, "lr": 1.2920150767552651e-05, "epoch": 3.26379746835443, "percentage": 65.37, "elapsed_time": "2:49:24", "remaining_time": "1:29:45"}
|
| 920 |
+
{"current_steps": 805, "total_steps": 1230, "loss": 0.2349, "lr": 1.2867095896080607e-05, "epoch": 3.2678481012658227, "percentage": 65.45, "elapsed_time": "2:49:51", "remaining_time": "1:29:40"}
|
| 921 |
+
{"current_steps": 806, "total_steps": 1230, "loss": 0.2821, "lr": 1.2814098472037612e-05, "epoch": 3.271898734177215, "percentage": 65.53, "elapsed_time": "2:50:24", "remaining_time": "1:29:38"}
|
| 922 |
+
{"current_steps": 807, "total_steps": 1230, "loss": 0.2785, "lr": 1.276115892225764e-05, "epoch": 3.2759493670886077, "percentage": 65.61, "elapsed_time": "2:50:57", "remaining_time": "1:29:36"}
|
| 923 |
+
{"current_steps": 808, "total_steps": 1230, "loss": 0.2513, "lr": 1.2708277673108555e-05, "epoch": 3.2800000000000002, "percentage": 65.69, "elapsed_time": "2:51:31", "remaining_time": "1:29:34"}
|
| 924 |
+
{"current_steps": 809, "total_steps": 1230, "loss": 0.277, "lr": 1.2655455150488649e-05, "epoch": 3.2840506329113923, "percentage": 65.77, "elapsed_time": "2:52:05", "remaining_time": "1:29:33"}
|
| 925 |
+
{"current_steps": 810, "total_steps": 1230, "loss": 0.2694, "lr": 1.2602691779823272e-05, "epoch": 3.288101265822785, "percentage": 65.85, "elapsed_time": "2:52:40", "remaining_time": "1:29:32"}
|
| 926 |
+
{"current_steps": 811, "total_steps": 1230, "loss": 0.2695, "lr": 1.2549987986061355e-05, "epoch": 3.2921518987341774, "percentage": 65.93, "elapsed_time": "2:53:12", "remaining_time": "1:29:29"}
|
| 927 |
+
{"current_steps": 812, "total_steps": 1230, "loss": 0.2707, "lr": 1.2497344193672005e-05, "epoch": 3.2962025316455694, "percentage": 66.02, "elapsed_time": "2:53:45", "remaining_time": "1:29:26"}
|
| 928 |
+
{"current_steps": 813, "total_steps": 1230, "loss": 0.2349, "lr": 1.2444760826641092e-05, "epoch": 3.300253164556962, "percentage": 66.1, "elapsed_time": "2:54:15", "remaining_time": "1:29:22"}
|
| 929 |
+
{"current_steps": 814, "total_steps": 1230, "loss": 0.2457, "lr": 1.2392238308467817e-05, "epoch": 3.3043037974683545, "percentage": 66.18, "elapsed_time": "2:54:43", "remaining_time": "1:29:17"}
|
| 930 |
+
{"current_steps": 815, "total_steps": 1230, "loss": 0.2381, "lr": 1.2339777062161326e-05, "epoch": 3.308354430379747, "percentage": 66.26, "elapsed_time": "2:55:15", "remaining_time": "1:29:14"}
|
| 931 |
+
{"current_steps": 816, "total_steps": 1230, "loss": 0.2604, "lr": 1.2287377510237293e-05, "epoch": 3.3124050632911395, "percentage": 66.34, "elapsed_time": "2:55:52", "remaining_time": "1:29:13"}
|
| 932 |
+
{"current_steps": 817, "total_steps": 1230, "loss": 0.2551, "lr": 1.2235040074714488e-05, "epoch": 3.3164556962025316, "percentage": 66.42, "elapsed_time": "2:56:21", "remaining_time": "1:29:09"}
|
| 933 |
+
{"current_steps": 818, "total_steps": 1230, "loss": 0.2635, "lr": 1.2182765177111434e-05, "epoch": 3.320506329113924, "percentage": 66.5, "elapsed_time": "2:56:51", "remaining_time": "1:29:04"}
|
| 934 |
+
{"current_steps": 819, "total_steps": 1230, "loss": 0.2406, "lr": 1.213055323844297e-05, "epoch": 3.3245569620253166, "percentage": 66.59, "elapsed_time": "2:57:21", "remaining_time": "1:29:00"}
|
| 935 |
+
{"current_steps": 820, "total_steps": 1230, "loss": 0.2965, "lr": 1.2078404679216864e-05, "epoch": 3.3286075949367087, "percentage": 66.67, "elapsed_time": "2:57:57", "remaining_time": "1:28:58"}
|
| 936 |
+
{"current_steps": 821, "total_steps": 1230, "loss": 0.2779, "lr": 1.2026319919430458e-05, "epoch": 3.332658227848101, "percentage": 66.75, "elapsed_time": "2:58:27", "remaining_time": "1:28:54"}
|
| 937 |
+
{"current_steps": 822, "total_steps": 1230, "loss": 0.2658, "lr": 1.1974299378567227e-05, "epoch": 3.3367088607594937, "percentage": 66.83, "elapsed_time": "2:59:01", "remaining_time": "1:28:51"}
|
| 938 |
+
{"current_steps": 823, "total_steps": 1230, "loss": 0.2956, "lr": 1.1922343475593462e-05, "epoch": 3.340759493670886, "percentage": 66.91, "elapsed_time": "2:59:33", "remaining_time": "1:28:47"}
|
| 939 |
+
{"current_steps": 824, "total_steps": 1230, "loss": 0.2789, "lr": 1.187045262895488e-05, "epoch": 3.3448101265822787, "percentage": 66.99, "elapsed_time": "2:59:59", "remaining_time": "1:28:41"}
|
| 940 |
+
{"current_steps": 825, "total_steps": 1230, "loss": 0.2603, "lr": 1.1818627256573203e-05, "epoch": 3.348860759493671, "percentage": 67.07, "elapsed_time": "3:00:33", "remaining_time": "1:28:38"}
|
| 941 |
+
{"current_steps": 826, "total_steps": 1230, "loss": 0.2648, "lr": 1.1766867775842864e-05, "epoch": 3.3529113924050633, "percentage": 67.15, "elapsed_time": "3:01:09", "remaining_time": "1:28:36"}
|
| 942 |
+
{"current_steps": 827, "total_steps": 1230, "loss": 0.2441, "lr": 1.1715174603627615e-05, "epoch": 3.356962025316456, "percentage": 67.24, "elapsed_time": "3:01:44", "remaining_time": "1:28:33"}
|
| 943 |
+
{"current_steps": 828, "total_steps": 1230, "loss": 0.2797, "lr": 1.1663548156257147e-05, "epoch": 3.361012658227848, "percentage": 67.32, "elapsed_time": "3:02:21", "remaining_time": "1:28:31"}
|
| 944 |
+
{"current_steps": 829, "total_steps": 1230, "loss": 0.2516, "lr": 1.161198884952377e-05, "epoch": 3.3650632911392404, "percentage": 67.4, "elapsed_time": "3:02:49", "remaining_time": "1:28:25"}
|
| 945 |
+
{"current_steps": 830, "total_steps": 1230, "loss": 0.2557, "lr": 1.1560497098679056e-05, "epoch": 3.369113924050633, "percentage": 67.48, "elapsed_time": "3:03:17", "remaining_time": "1:28:20"}
|
| 946 |
+
{"current_steps": 831, "total_steps": 1230, "loss": 0.2642, "lr": 1.1509073318430479e-05, "epoch": 3.3731645569620254, "percentage": 67.56, "elapsed_time": "3:03:52", "remaining_time": "1:28:17"}
|
| 947 |
+
{"current_steps": 832, "total_steps": 1230, "loss": 0.2606, "lr": 1.1457717922938116e-05, "epoch": 3.377215189873418, "percentage": 67.64, "elapsed_time": "3:04:19", "remaining_time": "1:28:10"}
|
| 948 |
+
{"current_steps": 833, "total_steps": 1230, "loss": 0.2814, "lr": 1.1406431325811233e-05, "epoch": 3.38126582278481, "percentage": 67.72, "elapsed_time": "3:04:56", "remaining_time": "1:28:08"}
|
| 949 |
+
{"current_steps": 834, "total_steps": 1230, "loss": 0.2544, "lr": 1.135521394010506e-05, "epoch": 3.3853164556962025, "percentage": 67.8, "elapsed_time": "3:05:27", "remaining_time": "1:28:03"}
|
| 950 |
+
{"current_steps": 835, "total_steps": 1230, "loss": 0.255, "lr": 1.1304066178317367e-05, "epoch": 3.389367088607595, "percentage": 67.89, "elapsed_time": "3:05:56", "remaining_time": "1:27:57"}
|
| 951 |
+
{"current_steps": 836, "total_steps": 1230, "loss": 0.2536, "lr": 1.1252988452385199e-05, "epoch": 3.393417721518987, "percentage": 67.97, "elapsed_time": "3:06:29", "remaining_time": "1:27:53"}
|
| 952 |
+
{"current_steps": 837, "total_steps": 1230, "loss": 0.2749, "lr": 1.1201981173681536e-05, "epoch": 3.3974683544303796, "percentage": 68.05, "elapsed_time": "3:07:00", "remaining_time": "1:27:48"}
|
| 953 |
+
{"current_steps": 838, "total_steps": 1230, "loss": 0.2822, "lr": 1.1151044753011991e-05, "epoch": 3.401518987341772, "percentage": 68.13, "elapsed_time": "3:07:34", "remaining_time": "1:27:44"}
|
| 954 |
+
{"current_steps": 839, "total_steps": 1230, "loss": 0.2402, "lr": 1.1100179600611491e-05, "epoch": 3.4055696202531647, "percentage": 68.21, "elapsed_time": "3:08:00", "remaining_time": "1:27:37"}
|
| 955 |
+
{"current_steps": 840, "total_steps": 1230, "loss": 0.2589, "lr": 1.1049386126140985e-05, "epoch": 3.409620253164557, "percentage": 68.29, "elapsed_time": "3:08:31", "remaining_time": "1:27:31"}
|
| 956 |
+
{"current_steps": 841, "total_steps": 1230, "loss": 0.2486, "lr": 1.0998664738684128e-05, "epoch": 3.4136708860759493, "percentage": 68.37, "elapsed_time": "3:09:01", "remaining_time": "1:27:26"}
|
| 957 |
+
{"current_steps": 842, "total_steps": 1230, "loss": 0.2688, "lr": 1.0948015846744e-05, "epoch": 3.4177215189873418, "percentage": 68.46, "elapsed_time": "3:09:35", "remaining_time": "1:27:22"}
|
| 958 |
+
{"current_steps": 843, "total_steps": 1230, "loss": 0.2744, "lr": 1.0897439858239832e-05, "epoch": 3.4217721518987343, "percentage": 68.54, "elapsed_time": "3:10:10", "remaining_time": "1:27:18"}
|
| 959 |
+
{"current_steps": 844, "total_steps": 1230, "loss": 0.2546, "lr": 1.0846937180503652e-05, "epoch": 3.4258227848101264, "percentage": 68.62, "elapsed_time": "3:10:43", "remaining_time": "1:27:13"}
|
| 960 |
+
{"current_steps": 845, "total_steps": 1230, "loss": 0.2458, "lr": 1.0796508220277117e-05, "epoch": 3.429873417721519, "percentage": 68.7, "elapsed_time": "3:11:12", "remaining_time": "1:27:06"}
|
| 961 |
+
{"current_steps": 846, "total_steps": 1230, "loss": 0.2739, "lr": 1.0746153383708107e-05, "epoch": 3.4339240506329114, "percentage": 68.78, "elapsed_time": "3:11:50", "remaining_time": "1:27:04"}
|
| 962 |
+
{"current_steps": 847, "total_steps": 1230, "loss": 0.2607, "lr": 1.0695873076347579e-05, "epoch": 3.437974683544304, "percentage": 68.86, "elapsed_time": "3:12:24", "remaining_time": "1:27:00"}
|
| 963 |
+
{"current_steps": 848, "total_steps": 1230, "loss": 0.241, "lr": 1.0645667703146205e-05, "epoch": 3.4420253164556964, "percentage": 68.94, "elapsed_time": "3:12:50", "remaining_time": "1:26:52"}
|
| 964 |
+
{"current_steps": 849, "total_steps": 1230, "loss": 0.243, "lr": 1.0595537668451161e-05, "epoch": 3.4460759493670885, "percentage": 69.02, "elapsed_time": "3:13:24", "remaining_time": "1:26:47"}
|
| 965 |
+
{"current_steps": 850, "total_steps": 1230, "loss": 0.2615, "lr": 1.0545483376002854e-05, "epoch": 3.450126582278481, "percentage": 69.11, "elapsed_time": "3:13:54", "remaining_time": "1:26:41"}
|
| 966 |
+
{"current_steps": 851, "total_steps": 1230, "loss": 0.2358, "lr": 1.0495505228931676e-05, "epoch": 3.4541772151898735, "percentage": 69.19, "elapsed_time": "3:14:25", "remaining_time": "1:26:35"}
|
| 967 |
+
{"current_steps": 852, "total_steps": 1230, "loss": 0.2675, "lr": 1.044560362975474e-05, "epoch": 3.4582278481012656, "percentage": 69.27, "elapsed_time": "3:15:06", "remaining_time": "1:26:33"}
|
| 968 |
+
{"current_steps": 853, "total_steps": 1230, "loss": 0.2547, "lr": 1.0395778980372695e-05, "epoch": 3.462278481012658, "percentage": 69.35, "elapsed_time": "3:15:38", "remaining_time": "1:26:27"}
|
| 969 |
+
{"current_steps": 854, "total_steps": 1230, "loss": 0.2873, "lr": 1.0346031682066381e-05, "epoch": 3.4663291139240506, "percentage": 69.43, "elapsed_time": "3:16:13", "remaining_time": "1:26:23"}
|
| 970 |
+
{"current_steps": 855, "total_steps": 1230, "loss": 0.2638, "lr": 1.0296362135493724e-05, "epoch": 3.470379746835443, "percentage": 69.51, "elapsed_time": "3:16:43", "remaining_time": "1:26:16"}
|
| 971 |
+
{"current_steps": 856, "total_steps": 1230, "loss": 0.2733, "lr": 1.0246770740686422e-05, "epoch": 3.4744303797468357, "percentage": 69.59, "elapsed_time": "3:17:17", "remaining_time": "1:26:12"}
|
| 972 |
+
{"current_steps": 857, "total_steps": 1230, "loss": 0.2526, "lr": 1.0197257897046743e-05, "epoch": 3.4784810126582277, "percentage": 69.67, "elapsed_time": "3:17:44", "remaining_time": "1:26:04"}
|
| 973 |
+
{"current_steps": 858, "total_steps": 1230, "loss": 0.2546, "lr": 1.014782400334433e-05, "epoch": 3.4825316455696202, "percentage": 69.76, "elapsed_time": "3:18:17", "remaining_time": "1:25:58"}
|
| 974 |
+
{"current_steps": 859, "total_steps": 1230, "loss": 0.264, "lr": 1.009846945771296e-05, "epoch": 3.4865822784810128, "percentage": 69.84, "elapsed_time": "3:18:46", "remaining_time": "1:25:51"}
|
| 975 |
+
{"current_steps": 860, "total_steps": 1230, "loss": 0.2339, "lr": 1.0049194657647363e-05, "epoch": 3.490632911392405, "percentage": 69.92, "elapsed_time": "3:19:14", "remaining_time": "1:25:43"}
|
| 976 |
+
{"current_steps": 861, "total_steps": 1230, "loss": 0.2369, "lr": 1.0000000000000006e-05, "epoch": 3.4946835443037974, "percentage": 70.0, "elapsed_time": "3:19:41", "remaining_time": "1:25:34"}
|
| 977 |
+
{"current_steps": 862, "total_steps": 1230, "loss": 0.2472, "lr": 9.950885880977891e-06, "epoch": 3.49873417721519, "percentage": 70.08, "elapsed_time": "3:20:13", "remaining_time": "1:25:28"}
|
| 978 |
+
{"current_steps": 863, "total_steps": 1230, "loss": 0.2847, "lr": 9.901852696139382e-06, "epoch": 3.5027848101265824, "percentage": 70.16, "elapsed_time": "3:20:49", "remaining_time": "1:25:24"}
|
| 979 |
+
{"current_steps": 864, "total_steps": 1230, "loss": 0.2897, "lr": 9.852900840391027e-06, "epoch": 3.506835443037975, "percentage": 70.24, "elapsed_time": "3:21:19", "remaining_time": "1:25:17"}
|
| 980 |
+
{"current_steps": 865, "total_steps": 1230, "loss": 0.2555, "lr": 9.804030707984313e-06, "epoch": 3.510886075949367, "percentage": 70.33, "elapsed_time": "3:21:54", "remaining_time": "1:25:12"}
|
| 981 |
+
{"current_steps": 866, "total_steps": 1230, "loss": 0.2479, "lr": 9.755242692512599e-06, "epoch": 3.5149367088607595, "percentage": 70.41, "elapsed_time": "3:22:25", "remaining_time": "1:25:05"}
|
| 982 |
+
{"current_steps": 867, "total_steps": 1230, "loss": 0.2808, "lr": 9.70653718690782e-06, "epoch": 3.518987341772152, "percentage": 70.49, "elapsed_time": "3:23:00", "remaining_time": "1:24:59"}
|
| 983 |
+
{"current_steps": 868, "total_steps": 1230, "loss": 0.2276, "lr": 9.657914583437454e-06, "epoch": 3.523037974683544, "percentage": 70.57, "elapsed_time": "3:23:34", "remaining_time": "1:24:53"}
|
| 984 |
+
{"current_steps": 869, "total_steps": 1230, "loss": 0.2601, "lr": 9.609375273701246e-06, "epoch": 3.5270886075949366, "percentage": 70.65, "elapsed_time": "3:24:10", "remaining_time": "1:24:49"}
|
| 985 |
+
{"current_steps": 870, "total_steps": 1230, "loss": 0.2401, "lr": 9.560919648628133e-06, "epoch": 3.531139240506329, "percentage": 70.73, "elapsed_time": "3:24:39", "remaining_time": "1:24:41"}
|
| 986 |
+
{"current_steps": 871, "total_steps": 1230, "loss": 0.2466, "lr": 9.512548098473047e-06, "epoch": 3.5351898734177216, "percentage": 70.81, "elapsed_time": "3:25:09", "remaining_time": "1:24:33"}
|
| 987 |
+
{"current_steps": 872, "total_steps": 1230, "loss": 0.2763, "lr": 9.464261012813825e-06, "epoch": 3.539240506329114, "percentage": 70.89, "elapsed_time": "3:25:42", "remaining_time": "1:24:27"}
|
| 988 |
+
{"current_steps": 873, "total_steps": 1230, "loss": 0.405, "lr": 9.416058780547987e-06, "epoch": 3.543291139240506, "percentage": 70.98, "elapsed_time": "3:26:16", "remaining_time": "1:24:21"}
|
| 989 |
+
{"current_steps": 874, "total_steps": 1230, "loss": 0.2442, "lr": 9.367941789889714e-06, "epoch": 3.5473417721518987, "percentage": 71.06, "elapsed_time": "3:26:45", "remaining_time": "1:24:13"}
|
| 990 |
+
{"current_steps": 875, "total_steps": 1230, "loss": 0.265, "lr": 9.319910428366607e-06, "epoch": 3.5513924050632912, "percentage": 71.14, "elapsed_time": "3:27:14", "remaining_time": "1:24:04"}
|
| 991 |
+
{"current_steps": 876, "total_steps": 1230, "loss": 0.248, "lr": 9.271965082816667e-06, "epoch": 3.5554430379746833, "percentage": 71.22, "elapsed_time": "3:27:43", "remaining_time": "1:23:56"}
|
| 992 |
+
{"current_steps": 877, "total_steps": 1230, "loss": 0.2418, "lr": 9.224106139385111e-06, "epoch": 3.559493670886076, "percentage": 71.3, "elapsed_time": "3:28:09", "remaining_time": "1:23:47"}
|
| 993 |
+
{"current_steps": 878, "total_steps": 1230, "loss": 0.2603, "lr": 9.176333983521291e-06, "epoch": 3.5635443037974683, "percentage": 71.38, "elapsed_time": "3:28:42", "remaining_time": "1:23:40"}
|
| 994 |
+
{"current_steps": 879, "total_steps": 1230, "loss": 0.2409, "lr": 9.12864899997558e-06, "epoch": 3.567594936708861, "percentage": 71.46, "elapsed_time": "3:29:14", "remaining_time": "1:23:33"}
|
| 995 |
+
{"current_steps": 880, "total_steps": 1230, "loss": 0.256, "lr": 9.08105157279628e-06, "epoch": 3.5716455696202534, "percentage": 71.54, "elapsed_time": "3:29:45", "remaining_time": "1:23:25"}
|
| 996 |
+
{"current_steps": 881, "total_steps": 1230, "loss": 0.2775, "lr": 9.03354208532653e-06, "epoch": 3.5756962025316454, "percentage": 71.63, "elapsed_time": "3:30:09", "remaining_time": "1:23:15"}
|
| 997 |
+
{"current_steps": 882, "total_steps": 1230, "loss": 0.2466, "lr": 8.986120920201205e-06, "epoch": 3.579746835443038, "percentage": 71.71, "elapsed_time": "3:30:41", "remaining_time": "1:23:07"}
|
| 998 |
+
{"current_steps": 883, "total_steps": 1230, "loss": 0.2562, "lr": 8.938788459343852e-06, "epoch": 3.5837974683544305, "percentage": 71.79, "elapsed_time": "3:31:12", "remaining_time": "1:22:59"}
|
| 999 |
+
{"current_steps": 884, "total_steps": 1230, "loss": 0.2469, "lr": 8.8915450839636e-06, "epoch": 3.5878481012658225, "percentage": 71.87, "elapsed_time": "3:31:42", "remaining_time": "1:22:51"}
|
| 1000 |
+
{"current_steps": 885, "total_steps": 1230, "loss": 0.2474, "lr": 8.844391174552116e-06, "epoch": 3.591898734177215, "percentage": 71.95, "elapsed_time": "3:32:15", "remaining_time": "1:22:44"}
|
| 1001 |
+
{"current_steps": 886, "total_steps": 1230, "loss": 0.2795, "lr": 8.797327110880479e-06, "epoch": 3.5959493670886076, "percentage": 72.03, "elapsed_time": "3:32:49", "remaining_time": "1:22:38"}
|
| 1002 |
+
{"current_steps": 887, "total_steps": 1230, "loss": 0.2505, "lr": 8.750353271996206e-06, "epoch": 3.6, "percentage": 72.11, "elapsed_time": "3:33:26", "remaining_time": "1:22:32"}
|
| 1003 |
+
{"current_steps": 888, "total_steps": 1230, "loss": 0.2384, "lr": 8.703470036220132e-06, "epoch": 3.6040506329113926, "percentage": 72.2, "elapsed_time": "3:33:52", "remaining_time": "1:22:22"}
|
| 1004 |
+
{"current_steps": 889, "total_steps": 1230, "loss": 0.2479, "lr": 8.656677781143394e-06, "epoch": 3.6081012658227847, "percentage": 72.28, "elapsed_time": "3:34:22", "remaining_time": "1:22:13"}
|
| 1005 |
+
{"current_steps": 890, "total_steps": 1230, "loss": 0.2444, "lr": 8.609976883624377e-06, "epoch": 3.612151898734177, "percentage": 72.36, "elapsed_time": "3:34:56", "remaining_time": "1:22:06"}
|
| 1006 |
+
{"current_steps": 891, "total_steps": 1230, "loss": 0.2577, "lr": 8.563367719785698e-06, "epoch": 3.6162025316455697, "percentage": 72.44, "elapsed_time": "3:35:31", "remaining_time": "1:22:00"}
|
| 1007 |
+
{"current_steps": 892, "total_steps": 1230, "loss": 0.2468, "lr": 8.516850665011138e-06, "epoch": 3.620253164556962, "percentage": 72.52, "elapsed_time": "3:36:03", "remaining_time": "1:21:52"}
|
| 1008 |
+
{"current_steps": 893, "total_steps": 1230, "loss": 0.2737, "lr": 8.47042609394269e-06, "epoch": 3.6243037974683543, "percentage": 72.6, "elapsed_time": "3:36:39", "remaining_time": "1:21:45"}
|
| 1009 |
+
{"current_steps": 894, "total_steps": 1230, "loss": 0.2607, "lr": 8.424094380477432e-06, "epoch": 3.628354430379747, "percentage": 72.68, "elapsed_time": "3:37:17", "remaining_time": "1:21:39"}
|
| 1010 |
+
{"current_steps": 895, "total_steps": 1230, "loss": 0.2693, "lr": 8.37785589776465e-06, "epoch": 3.6324050632911393, "percentage": 72.76, "elapsed_time": "3:37:52", "remaining_time": "1:21:33"}
|
| 1011 |
+
{"current_steps": 896, "total_steps": 1230, "loss": 0.2604, "lr": 8.331711018202694e-06, "epoch": 3.636455696202532, "percentage": 72.85, "elapsed_time": "3:38:22", "remaining_time": "1:21:24"}
|
| 1012 |
+
{"current_steps": 897, "total_steps": 1230, "loss": 0.2544, "lr": 8.285660113436104e-06, "epoch": 3.640506329113924, "percentage": 72.93, "elapsed_time": "3:38:59", "remaining_time": "1:21:17"}
|
| 1013 |
+
{"current_steps": 898, "total_steps": 1230, "loss": 0.2615, "lr": 8.239703554352527e-06, "epoch": 3.6445569620253164, "percentage": 73.01, "elapsed_time": "3:39:30", "remaining_time": "1:21:09"}
|
| 1014 |
+
{"current_steps": 899, "total_steps": 1230, "loss": 0.2687, "lr": 8.193841711079775e-06, "epoch": 3.648607594936709, "percentage": 73.09, "elapsed_time": "3:40:01", "remaining_time": "1:21:00"}
|
| 1015 |
+
{"current_steps": 900, "total_steps": 1230, "loss": 0.2717, "lr": 8.148074952982828e-06, "epoch": 3.652658227848101, "percentage": 73.17, "elapsed_time": "3:40:28", "remaining_time": "1:20:50"}
|
| 1016 |
+
{"current_steps": 901, "total_steps": 1230, "loss": 0.2724, "lr": 8.102403648660859e-06, "epoch": 3.6567088607594935, "percentage": 73.25, "elapsed_time": "3:40:59", "remaining_time": "1:20:41"}
|
| 1017 |
+
{"current_steps": 902, "total_steps": 1230, "loss": 0.2709, "lr": 8.056828165944282e-06, "epoch": 3.660759493670886, "percentage": 73.33, "elapsed_time": "3:41:29", "remaining_time": "1:20:32"}
|
| 1018 |
+
{"current_steps": 903, "total_steps": 1230, "loss": 0.2665, "lr": 8.011348871891762e-06, "epoch": 3.6648101265822786, "percentage": 73.41, "elapsed_time": "3:42:05", "remaining_time": "1:20:25"}
|
| 1019 |
+
{"current_steps": 904, "total_steps": 1230, "loss": 0.2449, "lr": 7.965966132787287e-06, "epoch": 3.668860759493671, "percentage": 73.5, "elapsed_time": "3:42:44", "remaining_time": "1:20:19"}
|
| 1020 |
+
{"current_steps": 905, "total_steps": 1230, "loss": 0.2705, "lr": 7.920680314137189e-06, "epoch": 3.672911392405063, "percentage": 73.58, "elapsed_time": "3:43:13", "remaining_time": "1:20:09"}
|
| 1021 |
+
{"current_steps": 906, "total_steps": 1230, "loss": 0.2593, "lr": 7.875491780667246e-06, "epoch": 3.6769620253164557, "percentage": 73.66, "elapsed_time": "3:43:48", "remaining_time": "1:20:02"}
|
| 1022 |
+
{"current_steps": 907, "total_steps": 1230, "loss": 0.2744, "lr": 7.830400896319667e-06, "epoch": 3.681012658227848, "percentage": 73.74, "elapsed_time": "3:44:13", "remaining_time": "1:19:51"}
|
| 1023 |
+
{"current_steps": 908, "total_steps": 1230, "loss": 0.2722, "lr": 7.785408024250259e-06, "epoch": 3.6850632911392402, "percentage": 73.82, "elapsed_time": "3:44:49", "remaining_time": "1:19:43"}
|
| 1024 |
+
{"current_steps": 909, "total_steps": 1230, "loss": 0.2406, "lr": 7.74051352682542e-06, "epoch": 3.6891139240506328, "percentage": 73.9, "elapsed_time": "3:45:20", "remaining_time": "1:19:34"}
|
| 1025 |
+
{"current_steps": 910, "total_steps": 1230, "loss": 0.2715, "lr": 7.695717765619257e-06, "epoch": 3.6931645569620253, "percentage": 73.98, "elapsed_time": "3:45:54", "remaining_time": "1:19:26"}
|
| 1026 |
+
{"current_steps": 911, "total_steps": 1230, "loss": 0.28, "lr": 7.651021101410673e-06, "epoch": 3.697215189873418, "percentage": 74.07, "elapsed_time": "3:46:27", "remaining_time": "1:19:17"}
|
| 1027 |
+
{"current_steps": 912, "total_steps": 1230, "loss": 0.2798, "lr": 7.606423894180464e-06, "epoch": 3.7012658227848103, "percentage": 74.15, "elapsed_time": "3:47:06", "remaining_time": "1:19:11"}
|
| 1028 |
+
{"current_steps": 913, "total_steps": 1230, "loss": 0.2754, "lr": 7.56192650310839e-06, "epoch": 3.7053164556962024, "percentage": 74.23, "elapsed_time": "3:47:43", "remaining_time": "1:19:03"}
|
| 1029 |
+
{"current_steps": 914, "total_steps": 1230, "loss": 0.254, "lr": 7.517529286570349e-06, "epoch": 3.709367088607595, "percentage": 74.31, "elapsed_time": "3:48:18", "remaining_time": "1:18:56"}
|
| 1030 |
+
{"current_steps": 915, "total_steps": 1230, "loss": 0.253, "lr": 7.473232602135387e-06, "epoch": 3.7134177215189874, "percentage": 74.39, "elapsed_time": "3:48:52", "remaining_time": "1:18:47"}
|
| 1031 |
+
{"current_steps": 916, "total_steps": 1230, "loss": 0.2606, "lr": 7.429036806562935e-06, "epoch": 3.7174683544303795, "percentage": 74.47, "elapsed_time": "3:49:27", "remaining_time": "1:18:39"}
|
| 1032 |
+
{"current_steps": 917, "total_steps": 1230, "loss": 0.2563, "lr": 7.3849422557998455e-06, "epoch": 3.721518987341772, "percentage": 74.55, "elapsed_time": "3:50:00", "remaining_time": "1:18:30"}
|
| 1033 |
+
{"current_steps": 918, "total_steps": 1230, "loss": 0.2714, "lr": 7.340949304977567e-06, "epoch": 3.7255696202531645, "percentage": 74.63, "elapsed_time": "3:50:33", "remaining_time": "1:18:21"}
|
| 1034 |
+
{"current_steps": 919, "total_steps": 1230, "loss": 0.2639, "lr": 7.297058308409282e-06, "epoch": 3.729620253164557, "percentage": 74.72, "elapsed_time": "3:51:04", "remaining_time": "1:18:11"}
|
| 1035 |
+
{"current_steps": 920, "total_steps": 1230, "loss": 0.2662, "lr": 7.25326961958704e-06, "epoch": 3.7336708860759495, "percentage": 74.8, "elapsed_time": "3:51:35", "remaining_time": "1:18:02"}
|
| 1036 |
+
{"current_steps": 921, "total_steps": 1230, "loss": 0.2721, "lr": 7.209583591178921e-06, "epoch": 3.7377215189873416, "percentage": 74.88, "elapsed_time": "3:52:06", "remaining_time": "1:17:52"}
|
| 1037 |
+
{"current_steps": 922, "total_steps": 1230, "loss": 0.2346, "lr": 7.1660005750261925e-06, "epoch": 3.741772151898734, "percentage": 74.96, "elapsed_time": "3:52:31", "remaining_time": "1:17:40"}
|
| 1038 |
+
{"current_steps": 923, "total_steps": 1230, "loss": 0.2533, "lr": 7.1225209221404765e-06, "epoch": 3.7458227848101266, "percentage": 75.04, "elapsed_time": "3:53:02", "remaining_time": "1:17:30"}
|
| 1039 |
+
{"current_steps": 924, "total_steps": 1230, "loss": 0.2515, "lr": 7.079144982700909e-06, "epoch": 3.7498734177215187, "percentage": 75.12, "elapsed_time": "3:53:33", "remaining_time": "1:17:20"}
|
| 1040 |
+
{"current_steps": 925, "total_steps": 1230, "loss": 0.2828, "lr": 7.0358731060513695e-06, "epoch": 3.7539240506329112, "percentage": 75.2, "elapsed_time": "3:54:10", "remaining_time": "1:17:12"}
|
| 1041 |
+
{"current_steps": 926, "total_steps": 1230, "loss": 0.2415, "lr": 6.99270564069757e-06, "epoch": 3.7579746835443038, "percentage": 75.28, "elapsed_time": "3:54:38", "remaining_time": "1:17:01"}
|
| 1042 |
+
{"current_steps": 927, "total_steps": 1230, "loss": 0.2622, "lr": 6.949642934304375e-06, "epoch": 3.7620253164556963, "percentage": 75.37, "elapsed_time": "3:55:05", "remaining_time": "1:16:50"}
|
| 1043 |
+
{"current_steps": 928, "total_steps": 1230, "loss": 0.2522, "lr": 6.906685333692871e-06, "epoch": 3.766075949367089, "percentage": 75.45, "elapsed_time": "3:55:40", "remaining_time": "1:16:41"}
|
| 1044 |
+
{"current_steps": 929, "total_steps": 1230, "loss": 0.2538, "lr": 6.86383318483769e-06, "epoch": 3.770126582278481, "percentage": 75.53, "elapsed_time": "3:56:11", "remaining_time": "1:16:31"}
|
| 1045 |
+
{"current_steps": 930, "total_steps": 1230, "loss": 0.2522, "lr": 6.821086832864139e-06, "epoch": 3.7741772151898734, "percentage": 75.61, "elapsed_time": "3:56:38", "remaining_time": "1:16:20"}
|
| 1046 |
+
{"current_steps": 931, "total_steps": 1230, "loss": 0.2678, "lr": 6.77844662204546e-06, "epoch": 3.778227848101266, "percentage": 75.69, "elapsed_time": "3:57:08", "remaining_time": "1:16:09"}
|
| 1047 |
+
{"current_steps": 932, "total_steps": 1230, "loss": 0.2559, "lr": 6.7359128958000455e-06, "epoch": 3.782278481012658, "percentage": 75.77, "elapsed_time": "3:57:43", "remaining_time": "1:16:00"}
|
| 1048 |
+
{"current_steps": 933, "total_steps": 1230, "loss": 0.2642, "lr": 6.693485996688695e-06, "epoch": 3.7863291139240505, "percentage": 75.85, "elapsed_time": "3:58:22", "remaining_time": "1:15:52"}
|
| 1049 |
+
{"current_steps": 934, "total_steps": 1230, "loss": 0.2557, "lr": 6.651166266411801e-06, "epoch": 3.790379746835443, "percentage": 75.93, "elapsed_time": "3:58:55", "remaining_time": "1:15:43"}
|
| 1050 |
+
{"current_steps": 935, "total_steps": 1230, "loss": 0.2755, "lr": 6.6089540458066725e-06, "epoch": 3.7944303797468355, "percentage": 76.02, "elapsed_time": "3:59:24", "remaining_time": "1:15:32"}
|
| 1051 |
+
{"current_steps": 936, "total_steps": 1230, "loss": 0.2405, "lr": 6.566849674844711e-06, "epoch": 3.798481012658228, "percentage": 76.1, "elapsed_time": "3:59:55", "remaining_time": "1:15:21"}
|
| 1052 |
+
{"current_steps": 937, "total_steps": 1230, "loss": 0.2364, "lr": 6.524853492628747e-06, "epoch": 3.80253164556962, "percentage": 76.18, "elapsed_time": "4:00:28", "remaining_time": "1:15:11"}
|
| 1053 |
+
{"current_steps": 938, "total_steps": 1230, "loss": 0.2644, "lr": 6.4829658373902536e-06, "epoch": 3.8065822784810126, "percentage": 76.26, "elapsed_time": "4:00:56", "remaining_time": "1:15:00"}
|
| 1054 |
+
{"current_steps": 939, "total_steps": 1230, "loss": 0.244, "lr": 6.441187046486648e-06, "epoch": 3.810632911392405, "percentage": 76.34, "elapsed_time": "4:01:27", "remaining_time": "1:14:49"}
|
| 1055 |
+
{"current_steps": 940, "total_steps": 1230, "loss": 0.2422, "lr": 6.399517456398567e-06, "epoch": 3.814683544303797, "percentage": 76.42, "elapsed_time": "4:01:55", "remaining_time": "1:14:38"}
|
| 1056 |
+
{"current_steps": 941, "total_steps": 1230, "loss": 0.2479, "lr": 6.357957402727164e-06, "epoch": 3.81873417721519, "percentage": 76.5, "elapsed_time": "4:02:25", "remaining_time": "1:14:27"}
|
| 1057 |
+
{"current_steps": 942, "total_steps": 1230, "loss": 0.2592, "lr": 6.316507220191395e-06, "epoch": 3.8227848101265822, "percentage": 76.59, "elapsed_time": "4:03:02", "remaining_time": "1:14:18"}
|
| 1058 |
+
{"current_steps": 943, "total_steps": 1230, "loss": 0.2515, "lr": 6.275167242625331e-06, "epoch": 3.8268354430379747, "percentage": 76.67, "elapsed_time": "4:03:31", "remaining_time": "1:14:07"}
|
| 1059 |
+
{"current_steps": 944, "total_steps": 1230, "loss": 0.2594, "lr": 6.233937802975471e-06, "epoch": 3.8308860759493673, "percentage": 76.75, "elapsed_time": "4:04:10", "remaining_time": "1:13:58"}
|
| 1060 |
+
{"current_steps": 945, "total_steps": 1230, "loss": 0.2705, "lr": 6.192819233298046e-06, "epoch": 3.8349367088607593, "percentage": 76.83, "elapsed_time": "4:04:42", "remaining_time": "1:13:48"}
|
| 1061 |
+
{"current_steps": 946, "total_steps": 1230, "loss": 0.2649, "lr": 6.151811864756383e-06, "epoch": 3.838987341772152, "percentage": 76.91, "elapsed_time": "4:05:15", "remaining_time": "1:13:37"}
|
| 1062 |
+
{"current_steps": 947, "total_steps": 1230, "loss": 0.2342, "lr": 6.1109160276181655e-06, "epoch": 3.8430379746835444, "percentage": 76.99, "elapsed_time": "4:05:47", "remaining_time": "1:13:27"}
|
| 1063 |
+
{"current_steps": 948, "total_steps": 1230, "loss": 0.265, "lr": 6.070132051252868e-06, "epoch": 3.847088607594937, "percentage": 77.07, "elapsed_time": "4:06:18", "remaining_time": "1:13:16"}
|
| 1064 |
+
{"current_steps": 949, "total_steps": 1230, "loss": 0.2619, "lr": 6.0294602641290034e-06, "epoch": 3.8511392405063294, "percentage": 77.15, "elapsed_time": "4:06:51", "remaining_time": "1:13:05"}
|
| 1065 |
+
{"current_steps": 950, "total_steps": 1230, "loss": 0.2808, "lr": 5.988900993811575e-06, "epoch": 3.8551898734177215, "percentage": 77.24, "elapsed_time": "4:07:24", "remaining_time": "1:12:55"}
|
| 1066 |
+
{"current_steps": 951, "total_steps": 1230, "loss": 0.2531, "lr": 5.948454566959363e-06, "epoch": 3.859240506329114, "percentage": 77.32, "elapsed_time": "4:07:58", "remaining_time": "1:12:44"}
|
| 1067 |
+
{"current_steps": 952, "total_steps": 1230, "loss": 0.2519, "lr": 5.908121309322328e-06, "epoch": 3.8632911392405065, "percentage": 77.4, "elapsed_time": "4:08:24", "remaining_time": "1:12:32"}
|
| 1068 |
+
{"current_steps": 953, "total_steps": 1230, "loss": 0.2517, "lr": 5.867901545738976e-06, "epoch": 3.8673417721518986, "percentage": 77.48, "elapsed_time": "4:08:56", "remaining_time": "1:12:21"}
|
| 1069 |
+
{"current_steps": 954, "total_steps": 1230, "loss": 0.2687, "lr": 5.827795600133774e-06, "epoch": 3.871392405063291, "percentage": 77.56, "elapsed_time": "4:09:27", "remaining_time": "1:12:10"}
|
| 1070 |
+
{"current_steps": 955, "total_steps": 1230, "loss": 0.261, "lr": 5.787803795514466e-06, "epoch": 3.8754430379746836, "percentage": 77.64, "elapsed_time": "4:10:01", "remaining_time": "1:11:59"}
|
| 1071 |
+
{"current_steps": 956, "total_steps": 1230, "loss": 0.2542, "lr": 5.747926453969576e-06, "epoch": 3.879493670886076, "percentage": 77.72, "elapsed_time": "4:10:33", "remaining_time": "1:11:48"}
|
| 1072 |
+
{"current_steps": 957, "total_steps": 1230, "loss": 0.2648, "lr": 5.708163896665708e-06, "epoch": 3.8835443037974686, "percentage": 77.8, "elapsed_time": "4:11:09", "remaining_time": "1:11:38"}
|
| 1073 |
+
{"current_steps": 958, "total_steps": 1230, "loss": 0.2771, "lr": 5.668516443845047e-06, "epoch": 3.8875949367088607, "percentage": 77.89, "elapsed_time": "4:11:41", "remaining_time": "1:11:27"}
|
| 1074 |
+
{"current_steps": 959, "total_steps": 1230, "loss": 0.2554, "lr": 5.6289844148227225e-06, "epoch": 3.891645569620253, "percentage": 77.97, "elapsed_time": "4:12:19", "remaining_time": "1:11:18"}
|
| 1075 |
+
{"current_steps": 960, "total_steps": 1230, "loss": 0.2726, "lr": 5.5895681279842615e-06, "epoch": 3.8956962025316457, "percentage": 78.05, "elapsed_time": "4:12:49", "remaining_time": "1:11:06"}
|
| 1076 |
+
{"current_steps": 961, "total_steps": 1230, "loss": 0.255, "lr": 5.550267900783019e-06, "epoch": 3.899746835443038, "percentage": 78.13, "elapsed_time": "4:13:21", "remaining_time": "1:10:55"}
|
| 1077 |
+
{"current_steps": 962, "total_steps": 1230, "loss": 0.2592, "lr": 5.511084049737623e-06, "epoch": 3.9037974683544303, "percentage": 78.21, "elapsed_time": "4:13:55", "remaining_time": "1:10:44"}
|
| 1078 |
+
{"current_steps": 963, "total_steps": 1230, "loss": 0.2348, "lr": 5.4720168904294215e-06, "epoch": 3.907848101265823, "percentage": 78.29, "elapsed_time": "4:14:32", "remaining_time": "1:10:34"}
|
| 1079 |
+
{"current_steps": 964, "total_steps": 1230, "loss": 0.2481, "lr": 5.433066737499948e-06, "epoch": 3.9118987341772153, "percentage": 78.37, "elapsed_time": "4:15:01", "remaining_time": "1:10:22"}
|
| 1080 |
+
{"current_steps": 965, "total_steps": 1230, "loss": 0.2492, "lr": 5.394233904648376e-06, "epoch": 3.915949367088608, "percentage": 78.46, "elapsed_time": "4:15:36", "remaining_time": "1:10:11"}
|
| 1081 |
+
{"current_steps": 966, "total_steps": 1230, "loss": 0.256, "lr": 5.355518704628997e-06, "epoch": 3.92, "percentage": 78.54, "elapsed_time": "4:16:05", "remaining_time": "1:09:59"}
|
| 1082 |
+
{"current_steps": 967, "total_steps": 1230, "loss": 0.2667, "lr": 5.316921449248731e-06, "epoch": 3.9240506329113924, "percentage": 78.62, "elapsed_time": "4:16:37", "remaining_time": "1:09:47"}
|
| 1083 |
+
{"current_steps": 968, "total_steps": 1230, "loss": 0.2571, "lr": 5.278442449364538e-06, "epoch": 3.928101265822785, "percentage": 78.7, "elapsed_time": "4:17:09", "remaining_time": "1:09:36"}
|
| 1084 |
+
{"current_steps": 969, "total_steps": 1230, "loss": 0.2349, "lr": 5.240082014881016e-06, "epoch": 3.932151898734177, "percentage": 78.78, "elapsed_time": "4:17:42", "remaining_time": "1:09:24"}
|
| 1085 |
+
{"current_steps": 970, "total_steps": 1230, "loss": 0.2798, "lr": 5.201840454747822e-06, "epoch": 3.9362025316455695, "percentage": 78.86, "elapsed_time": "4:18:18", "remaining_time": "1:09:14"}
|
| 1086 |
+
{"current_steps": 971, "total_steps": 1230, "loss": 0.2438, "lr": 5.163718076957223e-06, "epoch": 3.940253164556962, "percentage": 78.94, "elapsed_time": "4:18:54", "remaining_time": "1:09:03"}
|
| 1087 |
+
{"current_steps": 972, "total_steps": 1230, "loss": 0.2418, "lr": 5.125715188541609e-06, "epoch": 3.9443037974683546, "percentage": 79.02, "elapsed_time": "4:19:26", "remaining_time": "1:08:51"}
|
| 1088 |
+
{"current_steps": 973, "total_steps": 1230, "loss": 0.2817, "lr": 5.087832095571021e-06, "epoch": 3.948354430379747, "percentage": 79.11, "elapsed_time": "4:19:58", "remaining_time": "1:08:40"}
|
| 1089 |
+
{"current_steps": 974, "total_steps": 1230, "loss": 0.2433, "lr": 5.0500691031506766e-06, "epoch": 3.952405063291139, "percentage": 79.19, "elapsed_time": "4:20:26", "remaining_time": "1:08:27"}
|
| 1090 |
+
{"current_steps": 975, "total_steps": 1230, "loss": 0.2624, "lr": 5.01242651541854e-06, "epoch": 3.9564556962025317, "percentage": 79.27, "elapsed_time": "4:21:02", "remaining_time": "1:08:16"}
|
| 1091 |
+
{"current_steps": 976, "total_steps": 1230, "loss": 0.266, "lr": 4.974904635542815e-06, "epoch": 3.960506329113924, "percentage": 79.35, "elapsed_time": "4:21:35", "remaining_time": "1:08:04"}
|
| 1092 |
+
{"current_steps": 977, "total_steps": 1230, "loss": 0.2485, "lr": 4.937503765719582e-06, "epoch": 3.9645569620253163, "percentage": 79.43, "elapsed_time": "4:22:08", "remaining_time": "1:07:53"}
|
| 1093 |
+
{"current_steps": 978, "total_steps": 1230, "loss": 0.2518, "lr": 4.900224207170299e-06, "epoch": 3.968607594936709, "percentage": 79.51, "elapsed_time": "4:22:43", "remaining_time": "1:07:41"}
|
| 1094 |
+
{"current_steps": 979, "total_steps": 1230, "loss": 0.2708, "lr": 4.8630662601394065e-06, "epoch": 3.9726582278481013, "percentage": 79.59, "elapsed_time": "4:23:11", "remaining_time": "1:07:28"}
|
| 1095 |
+
{"current_steps": 980, "total_steps": 1230, "loss": 0.2436, "lr": 4.8260302238918995e-06, "epoch": 3.976708860759494, "percentage": 79.67, "elapsed_time": "4:23:43", "remaining_time": "1:07:16"}
|
| 1096 |
+
{"current_steps": 981, "total_steps": 1230, "loss": 0.2598, "lr": 4.789116396710924e-06, "epoch": 3.9807594936708863, "percentage": 79.76, "elapsed_time": "4:24:18", "remaining_time": "1:07:05"}
|
| 1097 |
+
{"current_steps": 982, "total_steps": 1230, "loss": 0.2472, "lr": 4.752325075895368e-06, "epoch": 3.9848101265822784, "percentage": 79.84, "elapsed_time": "4:24:46", "remaining_time": "1:06:52"}
|
| 1098 |
+
{"current_steps": 983, "total_steps": 1230, "loss": 0.2535, "lr": 4.715656557757473e-06, "epoch": 3.988860759493671, "percentage": 79.92, "elapsed_time": "4:25:25", "remaining_time": "1:06:41"}
|
| 1099 |
+
{"current_steps": 984, "total_steps": 1230, "loss": 0.2712, "lr": 4.679111137620442e-06, "epoch": 3.9929113924050634, "percentage": 80.0, "elapsed_time": "4:25:54", "remaining_time": "1:06:28"}
|
| 1100 |
+
{"current_steps": 985, "total_steps": 1230, "loss": 0.2712, "lr": 4.6426891098160585e-06, "epoch": 3.9969620253164555, "percentage": 80.08, "elapsed_time": "4:26:26", "remaining_time": "1:06:16"}
|
| 1101 |
+
{"current_steps": 986, "total_steps": 1230, "loss": 0.2612, "lr": 4.6063907676823474e-06, "epoch": 4.0010126582278485, "percentage": 80.16, "elapsed_time": "4:29:35", "remaining_time": "1:06:42"}
|
| 1102 |
+
{"current_steps": 987, "total_steps": 1230, "loss": 0.197, "lr": 4.570216403561141e-06, "epoch": 4.0050632911392405, "percentage": 80.24, "elapsed_time": "4:30:07", "remaining_time": "1:06:30"}
|
| 1103 |
+
{"current_steps": 988, "total_steps": 1230, "loss": 0.2262, "lr": 4.534166308795815e-06, "epoch": 4.009113924050633, "percentage": 80.33, "elapsed_time": "4:30:36", "remaining_time": "1:06:17"}
|
| 1104 |
+
{"current_steps": 989, "total_steps": 1230, "loss": 0.1877, "lr": 4.498240773728859e-06, "epoch": 4.013164556962026, "percentage": 80.41, "elapsed_time": "4:31:10", "remaining_time": "1:06:04"}
|
| 1105 |
+
{"current_steps": 990, "total_steps": 1230, "loss": 0.2029, "lr": 4.462440087699609e-06, "epoch": 4.017215189873418, "percentage": 80.49, "elapsed_time": "4:31:39", "remaining_time": "1:05:51"}
|
| 1106 |
+
{"current_steps": 991, "total_steps": 1230, "loss": 0.195, "lr": 4.426764539041861e-06, "epoch": 4.02126582278481, "percentage": 80.57, "elapsed_time": "4:32:13", "remaining_time": "1:05:39"}
|