Training in progress, epoch 3
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:32bba6402607af549609242ba3d1a07ffc0b7afee239fde05c4093c4ade88f97
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e0acb954c3c192d1ca1d15894685f13205792f1a73d9e404acd49fb5927dd4b0
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:219fa841f37389166f260563267cada4dcf9bffcfa719b3b28890772909564ea
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:495c868254edd3388d52e42f66630793d5551e0a173a6be54f657d63060635be
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -720,3 +720,242 @@
|
|
| 720 |
{"current_steps": 720, "total_steps": 1195, "loss": 0.2541, "lr": 1.6367262980411273e-05, "epoch": 3.004694835680751, "percentage": 60.25, "elapsed_time": "7:53:07", "remaining_time": "5:12:07"}
|
| 721 |
{"current_steps": 721, "total_steps": 1195, "loss": 0.2596, "lr": 1.6309802586311523e-05, "epoch": 3.00886802295253, "percentage": 60.33, "elapsed_time": "7:53:48", "remaining_time": "5:11:29"}
|
| 722 |
{"current_steps": 722, "total_steps": 1195, "loss": 0.2529, "lr": 1.6252373708285505e-05, "epoch": 3.013041210224309, "percentage": 60.42, "elapsed_time": "7:54:28", "remaining_time": "5:10:50"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 720 |
{"current_steps": 720, "total_steps": 1195, "loss": 0.2541, "lr": 1.6367262980411273e-05, "epoch": 3.004694835680751, "percentage": 60.25, "elapsed_time": "7:53:07", "remaining_time": "5:12:07"}
|
| 721 |
{"current_steps": 721, "total_steps": 1195, "loss": 0.2596, "lr": 1.6309802586311523e-05, "epoch": 3.00886802295253, "percentage": 60.33, "elapsed_time": "7:53:48", "remaining_time": "5:11:29"}
|
| 722 |
{"current_steps": 722, "total_steps": 1195, "loss": 0.2529, "lr": 1.6252373708285505e-05, "epoch": 3.013041210224309, "percentage": 60.42, "elapsed_time": "7:54:28", "remaining_time": "5:10:50"}
|
| 723 |
+
{"current_steps": 723, "total_steps": 1195, "loss": 0.2517, "lr": 1.6194976836803674e-05, "epoch": 3.0172143974960877, "percentage": 60.5, "elapsed_time": "7:55:08", "remaining_time": "5:10:11"}
|
| 724 |
+
{"current_steps": 724, "total_steps": 1195, "loss": 0.2586, "lr": 1.6137612462063112e-05, "epoch": 3.0213875847678664, "percentage": 60.59, "elapsed_time": "7:55:48", "remaining_time": "5:09:32"}
|
| 725 |
+
{"current_steps": 725, "total_steps": 1195, "loss": 0.2599, "lr": 1.6080281073983375e-05, "epoch": 3.025560772039645, "percentage": 60.67, "elapsed_time": "7:56:21", "remaining_time": "5:08:48"}
|
| 726 |
+
{"current_steps": 726, "total_steps": 1195, "loss": 0.2585, "lr": 1.602298316220229e-05, "epoch": 3.0297339593114243, "percentage": 60.75, "elapsed_time": "7:56:55", "remaining_time": "5:08:05"}
|
| 727 |
+
{"current_steps": 727, "total_steps": 1195, "loss": 0.2641, "lr": 1.5965719216071776e-05, "epoch": 3.033907146583203, "percentage": 60.84, "elapsed_time": "7:57:34", "remaining_time": "5:07:26"}
|
| 728 |
+
{"current_steps": 728, "total_steps": 1195, "loss": 0.2599, "lr": 1.590848972465369e-05, "epoch": 3.0380803338549818, "percentage": 60.92, "elapsed_time": "7:58:09", "remaining_time": "5:06:43"}
|
| 729 |
+
{"current_steps": 729, "total_steps": 1195, "loss": 0.2635, "lr": 1.5851295176715608e-05, "epoch": 3.0422535211267605, "percentage": 61.0, "elapsed_time": "7:58:50", "remaining_time": "5:06:05"}
|
| 730 |
+
{"current_steps": 730, "total_steps": 1195, "loss": 0.2608, "lr": 1.5794136060726682e-05, "epoch": 3.0464267083985392, "percentage": 61.09, "elapsed_time": "7:59:32", "remaining_time": "5:05:27"}
|
| 731 |
+
{"current_steps": 731, "total_steps": 1195, "loss": 0.254, "lr": 1.573701286485344e-05, "epoch": 3.0505998956703184, "percentage": 61.17, "elapsed_time": "8:00:12", "remaining_time": "5:04:48"}
|
| 732 |
+
{"current_steps": 732, "total_steps": 1195, "loss": 0.2358, "lr": 1.5679926076955677e-05, "epoch": 3.054773082942097, "percentage": 61.26, "elapsed_time": "8:00:58", "remaining_time": "5:04:13"}
|
| 733 |
+
{"current_steps": 733, "total_steps": 1195, "loss": 0.2552, "lr": 1.5622876184582205e-05, "epoch": 3.058946270213876, "percentage": 61.34, "elapsed_time": "8:01:36", "remaining_time": "5:03:33"}
|
| 734 |
+
{"current_steps": 734, "total_steps": 1195, "loss": 0.2613, "lr": 1.556586367496674e-05, "epoch": 3.0631194574856546, "percentage": 61.42, "elapsed_time": "8:02:14", "remaining_time": "5:02:52"}
|
| 735 |
+
{"current_steps": 735, "total_steps": 1195, "loss": 0.2723, "lr": 1.5508889035023738e-05, "epoch": 3.0672926447574334, "percentage": 61.51, "elapsed_time": "8:02:53", "remaining_time": "5:02:13"}
|
| 736 |
+
{"current_steps": 736, "total_steps": 1195, "loss": 0.2699, "lr": 1.5451952751344227e-05, "epoch": 3.0714658320292125, "percentage": 61.59, "elapsed_time": "8:03:35", "remaining_time": "5:01:35"}
|
| 737 |
+
{"current_steps": 737, "total_steps": 1195, "loss": 0.2543, "lr": 1.539505531019166e-05, "epoch": 3.0756390193009913, "percentage": 61.67, "elapsed_time": "8:04:14", "remaining_time": "5:00:55"}
|
| 738 |
+
{"current_steps": 738, "total_steps": 1195, "loss": 0.2622, "lr": 1.533819719749775e-05, "epoch": 3.07981220657277, "percentage": 61.76, "elapsed_time": "8:04:52", "remaining_time": "5:00:15"}
|
| 739 |
+
{"current_steps": 739, "total_steps": 1195, "loss": 0.2221, "lr": 1.5281378898858318e-05, "epoch": 3.0839853938445487, "percentage": 61.84, "elapsed_time": "8:05:28", "remaining_time": "4:59:33"}
|
| 740 |
+
{"current_steps": 740, "total_steps": 1195, "loss": 0.2626, "lr": 1.522460089952916e-05, "epoch": 3.0881585811163275, "percentage": 61.92, "elapsed_time": "8:06:10", "remaining_time": "4:58:55"}
|
| 741 |
+
{"current_steps": 741, "total_steps": 1195, "loss": 0.2706, "lr": 1.5167863684421913e-05, "epoch": 3.0923317683881066, "percentage": 62.01, "elapsed_time": "8:06:46", "remaining_time": "4:58:14"}
|
| 742 |
+
{"current_steps": 742, "total_steps": 1195, "loss": 0.2667, "lr": 1.511116773809987e-05, "epoch": 3.0965049556598854, "percentage": 62.09, "elapsed_time": "8:07:23", "remaining_time": "4:57:33"}
|
| 743 |
+
{"current_steps": 743, "total_steps": 1195, "loss": 0.2656, "lr": 1.5054513544773884e-05, "epoch": 3.100678142931664, "percentage": 62.18, "elapsed_time": "8:08:06", "remaining_time": "4:56:56"}
|
| 744 |
+
{"current_steps": 744, "total_steps": 1195, "loss": 0.2363, "lr": 1.4997901588298214e-05, "epoch": 3.104851330203443, "percentage": 62.26, "elapsed_time": "8:08:43", "remaining_time": "4:56:15"}
|
| 745 |
+
{"current_steps": 745, "total_steps": 1195, "loss": 0.2487, "lr": 1.4941332352166385e-05, "epoch": 3.1090245174752216, "percentage": 62.34, "elapsed_time": "8:09:22", "remaining_time": "4:55:35"}
|
| 746 |
+
{"current_steps": 746, "total_steps": 1195, "loss": 0.2456, "lr": 1.48848063195071e-05, "epoch": 3.1131977047470007, "percentage": 62.43, "elapsed_time": "8:09:56", "remaining_time": "4:54:53"}
|
| 747 |
+
{"current_steps": 747, "total_steps": 1195, "loss": 0.2507, "lr": 1.4828323973080054e-05, "epoch": 3.1173708920187795, "percentage": 62.51, "elapsed_time": "8:10:35", "remaining_time": "4:54:13"}
|
| 748 |
+
{"current_steps": 748, "total_steps": 1195, "loss": 0.2433, "lr": 1.4771885795271847e-05, "epoch": 3.121544079290558, "percentage": 62.59, "elapsed_time": "8:11:13", "remaining_time": "4:53:33"}
|
| 749 |
+
{"current_steps": 749, "total_steps": 1195, "loss": 0.269, "lr": 1.4715492268091858e-05, "epoch": 3.125717266562337, "percentage": 62.68, "elapsed_time": "8:11:52", "remaining_time": "4:52:53"}
|
| 750 |
+
{"current_steps": 750, "total_steps": 1195, "loss": 0.244, "lr": 1.4659143873168145e-05, "epoch": 3.1298904538341157, "percentage": 62.76, "elapsed_time": "8:12:33", "remaining_time": "4:52:15"}
|
| 751 |
+
{"current_steps": 751, "total_steps": 1195, "loss": 0.2534, "lr": 1.460284109174329e-05, "epoch": 3.134063641105895, "percentage": 62.85, "elapsed_time": "8:13:15", "remaining_time": "4:51:37"}
|
| 752 |
+
{"current_steps": 752, "total_steps": 1195, "loss": 0.2547, "lr": 1.4546584404670323e-05, "epoch": 3.1382368283776736, "percentage": 62.93, "elapsed_time": "8:13:54", "remaining_time": "4:50:57"}
|
| 753 |
+
{"current_steps": 753, "total_steps": 1195, "loss": 0.2689, "lr": 1.4490374292408613e-05, "epoch": 3.1424100156494523, "percentage": 63.01, "elapsed_time": "8:14:35", "remaining_time": "4:50:19"}
|
| 754 |
+
{"current_steps": 754, "total_steps": 1195, "loss": 0.2372, "lr": 1.443421123501974e-05, "epoch": 3.146583202921231, "percentage": 63.1, "elapsed_time": "8:15:15", "remaining_time": "4:49:39"}
|
| 755 |
+
{"current_steps": 755, "total_steps": 1195, "loss": 0.2592, "lr": 1.4378095712163439e-05, "epoch": 3.15075639019301, "percentage": 63.18, "elapsed_time": "8:15:56", "remaining_time": "4:49:01"}
|
| 756 |
+
{"current_steps": 756, "total_steps": 1195, "loss": 0.2493, "lr": 1.4322028203093452e-05, "epoch": 3.1549295774647885, "percentage": 63.26, "elapsed_time": "8:16:32", "remaining_time": "4:48:20"}
|
| 757 |
+
{"current_steps": 757, "total_steps": 1195, "loss": 0.27, "lr": 1.4266009186653471e-05, "epoch": 3.1591027647365677, "percentage": 63.35, "elapsed_time": "8:17:16", "remaining_time": "4:47:43"}
|
| 758 |
+
{"current_steps": 758, "total_steps": 1195, "loss": 0.2435, "lr": 1.4210039141273032e-05, "epoch": 3.1632759520083464, "percentage": 63.43, "elapsed_time": "8:17:54", "remaining_time": "4:47:03"}
|
| 759 |
+
{"current_steps": 759, "total_steps": 1195, "loss": 0.2598, "lr": 1.4154118544963453e-05, "epoch": 3.167449139280125, "percentage": 63.51, "elapsed_time": "8:18:34", "remaining_time": "4:46:24"}
|
| 760 |
+
{"current_steps": 760, "total_steps": 1195, "loss": 0.2625, "lr": 1.409824787531371e-05, "epoch": 3.171622326551904, "percentage": 63.6, "elapsed_time": "8:19:14", "remaining_time": "4:45:45"}
|
| 761 |
+
{"current_steps": 761, "total_steps": 1195, "loss": 0.2793, "lr": 1.4042427609486393e-05, "epoch": 3.1757955138236826, "percentage": 63.68, "elapsed_time": "8:19:55", "remaining_time": "4:45:06"}
|
| 762 |
+
{"current_steps": 762, "total_steps": 1195, "loss": 0.2694, "lr": 1.3986658224213603e-05, "epoch": 3.179968701095462, "percentage": 63.77, "elapsed_time": "8:20:36", "remaining_time": "4:44:28"}
|
| 763 |
+
{"current_steps": 763, "total_steps": 1195, "loss": 0.2511, "lr": 1.393094019579293e-05, "epoch": 3.1841418883672405, "percentage": 63.85, "elapsed_time": "8:21:16", "remaining_time": "4:43:48"}
|
| 764 |
+
{"current_steps": 764, "total_steps": 1195, "loss": 0.266, "lr": 1.3875274000083319e-05, "epoch": 3.1883150756390193, "percentage": 63.93, "elapsed_time": "8:22:00", "remaining_time": "4:43:12"}
|
| 765 |
+
{"current_steps": 765, "total_steps": 1195, "loss": 0.2433, "lr": 1.3819660112501054e-05, "epoch": 3.192488262910798, "percentage": 64.02, "elapsed_time": "8:22:38", "remaining_time": "4:42:31"}
|
| 766 |
+
{"current_steps": 766, "total_steps": 1195, "loss": 0.2539, "lr": 1.3764099008015676e-05, "epoch": 3.1966614501825767, "percentage": 64.1, "elapsed_time": "8:23:21", "remaining_time": "4:41:54"}
|
| 767 |
+
{"current_steps": 767, "total_steps": 1195, "loss": 0.2716, "lr": 1.3708591161145934e-05, "epoch": 3.200834637454356, "percentage": 64.18, "elapsed_time": "8:24:01", "remaining_time": "4:41:15"}
|
| 768 |
+
{"current_steps": 768, "total_steps": 1195, "loss": 0.2387, "lr": 1.365313704595574e-05, "epoch": 3.2050078247261347, "percentage": 64.27, "elapsed_time": "8:24:37", "remaining_time": "4:40:34"}
|
| 769 |
+
{"current_steps": 769, "total_steps": 1195, "loss": 0.2683, "lr": 1.35977371360501e-05, "epoch": 3.2091810119979134, "percentage": 64.35, "elapsed_time": "8:25:11", "remaining_time": "4:39:51"}
|
| 770 |
+
{"current_steps": 770, "total_steps": 1195, "loss": 0.2503, "lr": 1.3542391904571082e-05, "epoch": 3.213354199269692, "percentage": 64.44, "elapsed_time": "8:25:48", "remaining_time": "4:39:10"}
|
| 771 |
+
{"current_steps": 771, "total_steps": 1195, "loss": 0.2478, "lr": 1.348710182419377e-05, "epoch": 3.217527386541471, "percentage": 64.52, "elapsed_time": "8:26:24", "remaining_time": "4:38:29"}
|
| 772 |
+
{"current_steps": 772, "total_steps": 1195, "loss": 0.2511, "lr": 1.3431867367122257e-05, "epoch": 3.22170057381325, "percentage": 64.6, "elapsed_time": "8:27:04", "remaining_time": "4:37:50"}
|
| 773 |
+
{"current_steps": 773, "total_steps": 1195, "loss": 0.2474, "lr": 1.3376689005085557e-05, "epoch": 3.2258737610850288, "percentage": 64.69, "elapsed_time": "8:27:40", "remaining_time": "4:37:08"}
|
| 774 |
+
{"current_steps": 774, "total_steps": 1195, "loss": 0.2664, "lr": 1.332156720933361e-05, "epoch": 3.2300469483568075, "percentage": 64.77, "elapsed_time": "8:28:19", "remaining_time": "4:36:29"}
|
| 775 |
+
{"current_steps": 775, "total_steps": 1195, "loss": 0.233, "lr": 1.326650245063326e-05, "epoch": 3.2342201356285862, "percentage": 64.85, "elapsed_time": "8:28:52", "remaining_time": "4:35:46"}
|
| 776 |
+
{"current_steps": 776, "total_steps": 1195, "loss": 0.247, "lr": 1.3211495199264216e-05, "epoch": 3.238393322900365, "percentage": 64.94, "elapsed_time": "8:29:31", "remaining_time": "4:35:06"}
|
| 777 |
+
{"current_steps": 777, "total_steps": 1195, "loss": 0.267, "lr": 1.3156545925015074e-05, "epoch": 3.242566510172144, "percentage": 65.02, "elapsed_time": "8:30:09", "remaining_time": "4:34:27"}
|
| 778 |
+
{"current_steps": 778, "total_steps": 1195, "loss": 0.2578, "lr": 1.3101655097179245e-05, "epoch": 3.246739697443923, "percentage": 65.1, "elapsed_time": "8:30:48", "remaining_time": "4:33:47"}
|
| 779 |
+
{"current_steps": 779, "total_steps": 1195, "loss": 0.2517, "lr": 1.3046823184550995e-05, "epoch": 3.2509128847157016, "percentage": 65.19, "elapsed_time": "8:31:28", "remaining_time": "4:33:08"}
|
| 780 |
+
{"current_steps": 780, "total_steps": 1195, "loss": 0.2453, "lr": 1.2992050655421413e-05, "epoch": 3.2550860719874803, "percentage": 65.27, "elapsed_time": "8:32:03", "remaining_time": "4:32:26"}
|
| 781 |
+
{"current_steps": 781, "total_steps": 1195, "loss": 0.2548, "lr": 1.2937337977574452e-05, "epoch": 3.259259259259259, "percentage": 65.36, "elapsed_time": "8:32:46", "remaining_time": "4:31:49"}
|
| 782 |
+
{"current_steps": 782, "total_steps": 1195, "loss": 0.2786, "lr": 1.2882685618282876e-05, "epoch": 3.2634324465310383, "percentage": 65.44, "elapsed_time": "8:33:26", "remaining_time": "4:31:10"}
|
| 783 |
+
{"current_steps": 783, "total_steps": 1195, "loss": 0.2458, "lr": 1.2828094044304316e-05, "epoch": 3.267605633802817, "percentage": 65.52, "elapsed_time": "8:34:05", "remaining_time": "4:30:30"}
|
| 784 |
+
{"current_steps": 784, "total_steps": 1195, "loss": 0.2759, "lr": 1.2773563721877258e-05, "epoch": 3.2717788210745957, "percentage": 65.61, "elapsed_time": "8:34:48", "remaining_time": "4:29:52"}
|
| 785 |
+
{"current_steps": 785, "total_steps": 1195, "loss": 0.2489, "lr": 1.2719095116717069e-05, "epoch": 3.2759520083463745, "percentage": 65.69, "elapsed_time": "8:35:30", "remaining_time": "4:29:14"}
|
| 786 |
+
{"current_steps": 786, "total_steps": 1195, "loss": 0.2476, "lr": 1.2664688694012042e-05, "epoch": 3.280125195618153, "percentage": 65.77, "elapsed_time": "8:36:07", "remaining_time": "4:28:34"}
|
| 787 |
+
{"current_steps": 787, "total_steps": 1195, "loss": 0.2438, "lr": 1.2610344918419379e-05, "epoch": 3.2842983828899324, "percentage": 65.86, "elapsed_time": "8:36:47", "remaining_time": "4:27:54"}
|
| 788 |
+
{"current_steps": 788, "total_steps": 1195, "loss": 0.2496, "lr": 1.2556064254061249e-05, "epoch": 3.288471570161711, "percentage": 65.94, "elapsed_time": "8:37:26", "remaining_time": "4:27:15"}
|
| 789 |
+
{"current_steps": 789, "total_steps": 1195, "loss": 0.2433, "lr": 1.2501847164520817e-05, "epoch": 3.29264475743349, "percentage": 66.03, "elapsed_time": "8:38:04", "remaining_time": "4:26:35"}
|
| 790 |
+
{"current_steps": 790, "total_steps": 1195, "loss": 0.2544, "lr": 1.2447694112838309e-05, "epoch": 3.2968179447052686, "percentage": 66.11, "elapsed_time": "8:38:43", "remaining_time": "4:25:55"}
|
| 791 |
+
{"current_steps": 791, "total_steps": 1195, "loss": 0.251, "lr": 1.239360556150702e-05, "epoch": 3.3009911319770473, "percentage": 66.19, "elapsed_time": "8:39:22", "remaining_time": "4:25:16"}
|
| 792 |
+
{"current_steps": 792, "total_steps": 1195, "loss": 0.2644, "lr": 1.2339581972469375e-05, "epoch": 3.3051643192488265, "percentage": 66.28, "elapsed_time": "8:40:02", "remaining_time": "4:24:37"}
|
| 793 |
+
{"current_steps": 793, "total_steps": 1195, "loss": 0.2462, "lr": 1.2285623807113e-05, "epoch": 3.309337506520605, "percentage": 66.36, "elapsed_time": "8:40:45", "remaining_time": "4:23:59"}
|
| 794 |
+
{"current_steps": 794, "total_steps": 1195, "loss": 0.275, "lr": 1.2231731526266774e-05, "epoch": 3.313510693792384, "percentage": 66.44, "elapsed_time": "8:41:26", "remaining_time": "4:23:20"}
|
| 795 |
+
{"current_steps": 795, "total_steps": 1195, "loss": 0.2346, "lr": 1.2177905590196884e-05, "epoch": 3.3176838810641627, "percentage": 66.53, "elapsed_time": "8:42:00", "remaining_time": "4:22:38"}
|
| 796 |
+
{"current_steps": 796, "total_steps": 1195, "loss": 0.2577, "lr": 1.2124146458602896e-05, "epoch": 3.3218570683359414, "percentage": 66.61, "elapsed_time": "8:42:37", "remaining_time": "4:21:58"}
|
| 797 |
+
{"current_steps": 797, "total_steps": 1195, "loss": 0.2589, "lr": 1.2070454590613844e-05, "epoch": 3.3260302556077206, "percentage": 66.69, "elapsed_time": "8:43:22", "remaining_time": "4:21:21"}
|
| 798 |
+
{"current_steps": 798, "total_steps": 1195, "loss": 0.2517, "lr": 1.2016830444784287e-05, "epoch": 3.3302034428794993, "percentage": 66.78, "elapsed_time": "8:44:03", "remaining_time": "4:20:43"}
|
| 799 |
+
{"current_steps": 799, "total_steps": 1195, "loss": 0.2688, "lr": 1.1963274479090417e-05, "epoch": 3.334376630151278, "percentage": 66.86, "elapsed_time": "8:44:36", "remaining_time": "4:20:00"}
|
| 800 |
+
{"current_steps": 800, "total_steps": 1195, "loss": 0.2515, "lr": 1.1909787150926128e-05, "epoch": 3.338549817423057, "percentage": 66.95, "elapsed_time": "8:45:12", "remaining_time": "4:19:19"}
|
| 801 |
+
{"current_steps": 801, "total_steps": 1195, "loss": 0.2529, "lr": 1.1856368917099114e-05, "epoch": 3.3427230046948355, "percentage": 67.03, "elapsed_time": "8:45:50", "remaining_time": "4:18:39"}
|
| 802 |
+
{"current_steps": 802, "total_steps": 1195, "loss": 0.2498, "lr": 1.1803020233826965e-05, "epoch": 3.3468961919666143, "percentage": 67.11, "elapsed_time": "8:46:31", "remaining_time": "4:18:00"}
|
| 803 |
+
{"current_steps": 803, "total_steps": 1195, "loss": 0.2563, "lr": 1.1749741556733297e-05, "epoch": 3.3510693792383934, "percentage": 67.2, "elapsed_time": "8:47:13", "remaining_time": "4:17:22"}
|
| 804 |
+
{"current_steps": 804, "total_steps": 1195, "loss": 0.2673, "lr": 1.1696533340843814e-05, "epoch": 3.355242566510172, "percentage": 67.28, "elapsed_time": "8:47:50", "remaining_time": "4:16:41"}
|
| 805 |
+
{"current_steps": 805, "total_steps": 1195, "loss": 0.2601, "lr": 1.1643396040582468e-05, "epoch": 3.359415753781951, "percentage": 67.36, "elapsed_time": "8:48:33", "remaining_time": "4:16:04"}
|
| 806 |
+
{"current_steps": 806, "total_steps": 1195, "loss": 0.2564, "lr": 1.1590330109767532e-05, "epoch": 3.3635889410537296, "percentage": 67.45, "elapsed_time": "8:49:14", "remaining_time": "4:15:25"}
|
| 807 |
+
{"current_steps": 807, "total_steps": 1195, "loss": 0.2585, "lr": 1.153733600160777e-05, "epoch": 3.3677621283255084, "percentage": 67.53, "elapsed_time": "8:49:51", "remaining_time": "4:14:45"}
|
| 808 |
+
{"current_steps": 808, "total_steps": 1195, "loss": 0.2491, "lr": 1.1484414168698547e-05, "epoch": 3.3719353155972875, "percentage": 67.62, "elapsed_time": "8:50:26", "remaining_time": "4:14:03"}
|
| 809 |
+
{"current_steps": 809, "total_steps": 1195, "loss": 0.2753, "lr": 1.1431565063017955e-05, "epoch": 3.3761085028690663, "percentage": 67.7, "elapsed_time": "8:51:04", "remaining_time": "4:13:23"}
|
| 810 |
+
{"current_steps": 810, "total_steps": 1195, "loss": 0.2472, "lr": 1.1378789135922954e-05, "epoch": 3.380281690140845, "percentage": 67.78, "elapsed_time": "8:51:42", "remaining_time": "4:12:43"}
|
| 811 |
+
{"current_steps": 811, "total_steps": 1195, "loss": 0.2555, "lr": 1.1326086838145528e-05, "epoch": 3.3844548774126237, "percentage": 67.87, "elapsed_time": "8:52:26", "remaining_time": "4:12:06"}
|
| 812 |
+
{"current_steps": 812, "total_steps": 1195, "loss": 0.263, "lr": 1.1273458619788844e-05, "epoch": 3.3886280646844025, "percentage": 67.95, "elapsed_time": "8:53:15", "remaining_time": "4:11:31"}
|
| 813 |
+
{"current_steps": 813, "total_steps": 1195, "loss": 0.2641, "lr": 1.1220904930323386e-05, "epoch": 3.3928012519561817, "percentage": 68.03, "elapsed_time": "8:53:56", "remaining_time": "4:10:52"}
|
| 814 |
+
{"current_steps": 814, "total_steps": 1195, "loss": 0.2595, "lr": 1.1168426218583109e-05, "epoch": 3.3969744392279604, "percentage": 68.12, "elapsed_time": "8:54:38", "remaining_time": "4:10:14"}
|
| 815 |
+
{"current_steps": 815, "total_steps": 1195, "loss": 0.24, "lr": 1.1116022932761648e-05, "epoch": 3.401147626499739, "percentage": 68.2, "elapsed_time": "8:55:21", "remaining_time": "4:09:37"}
|
| 816 |
+
{"current_steps": 816, "total_steps": 1195, "loss": 0.2694, "lr": 1.1063695520408442e-05, "epoch": 3.405320813771518, "percentage": 68.28, "elapsed_time": "8:55:59", "remaining_time": "4:08:56"}
|
| 817 |
+
{"current_steps": 817, "total_steps": 1195, "loss": 0.2271, "lr": 1.1011444428424946e-05, "epoch": 3.4094940010432966, "percentage": 68.37, "elapsed_time": "8:56:35", "remaining_time": "4:08:15"}
|
| 818 |
+
{"current_steps": 818, "total_steps": 1195, "loss": 0.258, "lr": 1.0959270103060814e-05, "epoch": 3.4136671883150758, "percentage": 68.45, "elapsed_time": "8:57:12", "remaining_time": "4:07:35"}
|
| 819 |
+
{"current_steps": 819, "total_steps": 1195, "loss": 0.246, "lr": 1.0907172989910046e-05, "epoch": 3.4178403755868545, "percentage": 68.54, "elapsed_time": "8:57:51", "remaining_time": "4:06:55"}
|
| 820 |
+
{"current_steps": 820, "total_steps": 1195, "loss": 0.2468, "lr": 1.085515353390723e-05, "epoch": 3.4220135628586332, "percentage": 68.62, "elapsed_time": "8:58:30", "remaining_time": "4:06:16"}
|
| 821 |
+
{"current_steps": 821, "total_steps": 1195, "loss": 0.2567, "lr": 1.0803212179323727e-05, "epoch": 3.426186750130412, "percentage": 68.7, "elapsed_time": "8:59:07", "remaining_time": "4:05:35"}
|
| 822 |
+
{"current_steps": 822, "total_steps": 1195, "loss": 0.267, "lr": 1.0751349369763882e-05, "epoch": 3.4303599374021907, "percentage": 68.79, "elapsed_time": "8:59:46", "remaining_time": "4:04:56"}
|
| 823 |
+
{"current_steps": 823, "total_steps": 1195, "loss": 0.261, "lr": 1.0699565548161191e-05, "epoch": 3.43453312467397, "percentage": 68.87, "elapsed_time": "9:00:28", "remaining_time": "4:04:17"}
|
| 824 |
+
{"current_steps": 824, "total_steps": 1195, "loss": 0.2746, "lr": 1.06478611567746e-05, "epoch": 3.4387063119457486, "percentage": 68.95, "elapsed_time": "9:01:10", "remaining_time": "4:03:39"}
|
| 825 |
+
{"current_steps": 825, "total_steps": 1195, "loss": 0.2621, "lr": 1.0596236637184631e-05, "epoch": 3.4428794992175273, "percentage": 69.04, "elapsed_time": "9:01:54", "remaining_time": "4:03:02"}
|
| 826 |
+
{"current_steps": 826, "total_steps": 1195, "loss": 0.2608, "lr": 1.0544692430289731e-05, "epoch": 3.447052686489306, "percentage": 69.12, "elapsed_time": "9:02:35", "remaining_time": "4:02:23"}
|
| 827 |
+
{"current_steps": 827, "total_steps": 1195, "loss": 0.2478, "lr": 1.0493228976302374e-05, "epoch": 3.451225873761085, "percentage": 69.21, "elapsed_time": "9:03:15", "remaining_time": "4:01:44"}
|
| 828 |
+
{"current_steps": 828, "total_steps": 1195, "loss": 0.2465, "lr": 1.0441846714745403e-05, "epoch": 3.455399061032864, "percentage": 69.29, "elapsed_time": "9:03:55", "remaining_time": "4:01:05"}
|
| 829 |
+
{"current_steps": 829, "total_steps": 1195, "loss": 0.2668, "lr": 1.0390546084448211e-05, "epoch": 3.4595722483046427, "percentage": 69.37, "elapsed_time": "9:04:36", "remaining_time": "4:00:26"}
|
| 830 |
+
{"current_steps": 830, "total_steps": 1195, "loss": 0.2687, "lr": 1.0339327523543043e-05, "epoch": 3.4637454355764214, "percentage": 69.46, "elapsed_time": "9:05:15", "remaining_time": "3:59:47"}
|
| 831 |
+
{"current_steps": 831, "total_steps": 1195, "loss": 0.2593, "lr": 1.0288191469461233e-05, "epoch": 3.4679186228482, "percentage": 69.54, "elapsed_time": "9:05:50", "remaining_time": "3:59:05"}
|
| 832 |
+
{"current_steps": 832, "total_steps": 1195, "loss": 0.248, "lr": 1.0237138358929438e-05, "epoch": 3.472091810119979, "percentage": 69.62, "elapsed_time": "9:06:32", "remaining_time": "3:58:27"}
|
| 833 |
+
{"current_steps": 833, "total_steps": 1195, "loss": 0.2555, "lr": 1.0186168627965966e-05, "epoch": 3.476264997391758, "percentage": 69.71, "elapsed_time": "9:07:04", "remaining_time": "3:57:44"}
|
| 834 |
+
{"current_steps": 834, "total_steps": 1195, "loss": 0.2548, "lr": 1.0135282711877014e-05, "epoch": 3.480438184663537, "percentage": 69.79, "elapsed_time": "9:07:40", "remaining_time": "3:57:03"}
|
| 835 |
+
{"current_steps": 835, "total_steps": 1195, "loss": 0.2704, "lr": 1.0084481045252965e-05, "epoch": 3.4846113719353156, "percentage": 69.87, "elapsed_time": "9:08:24", "remaining_time": "3:56:26"}
|
| 836 |
+
{"current_steps": 836, "total_steps": 1195, "loss": 0.2458, "lr": 1.0033764061964648e-05, "epoch": 3.4887845592070943, "percentage": 69.96, "elapsed_time": "9:09:02", "remaining_time": "3:55:46"}
|
| 837 |
+
{"current_steps": 837, "total_steps": 1195, "loss": 0.2522, "lr": 9.98313219515969e-06, "epoch": 3.492957746478873, "percentage": 70.04, "elapsed_time": "9:09:40", "remaining_time": "3:55:06"}
|
| 838 |
+
{"current_steps": 838, "total_steps": 1195, "loss": 0.2585, "lr": 9.932585877258738e-06, "epoch": 3.497130933750652, "percentage": 70.13, "elapsed_time": "9:10:18", "remaining_time": "3:54:26"}
|
| 839 |
+
{"current_steps": 839, "total_steps": 1195, "loss": 0.2693, "lr": 9.882125539951865e-06, "epoch": 3.501304121022431, "percentage": 70.21, "elapsed_time": "9:10:58", "remaining_time": "3:53:47"}
|
| 840 |
+
{"current_steps": 840, "total_steps": 1195, "loss": 0.2399, "lr": 9.83175161419478e-06, "epoch": 3.5054773082942097, "percentage": 70.29, "elapsed_time": "9:11:37", "remaining_time": "3:53:07"}
|
| 841 |
+
{"current_steps": 841, "total_steps": 1195, "loss": 0.2617, "lr": 9.781464530205226e-06, "epoch": 3.5096504955659884, "percentage": 70.38, "elapsed_time": "9:12:18", "remaining_time": "3:52:28"}
|
| 842 |
+
{"current_steps": 842, "total_steps": 1195, "loss": 0.2645, "lr": 9.73126471745925e-06, "epoch": 3.513823682837767, "percentage": 70.46, "elapsed_time": "9:12:59", "remaining_time": "3:51:50"}
|
| 843 |
+
{"current_steps": 843, "total_steps": 1195, "loss": 0.2521, "lr": 9.68115260468758e-06, "epoch": 3.5179968701095463, "percentage": 70.54, "elapsed_time": "9:13:34", "remaining_time": "3:51:09"}
|
| 844 |
+
{"current_steps": 844, "total_steps": 1195, "loss": 0.2486, "lr": 9.631128619871945e-06, "epoch": 3.522170057381325, "percentage": 70.63, "elapsed_time": "9:14:14", "remaining_time": "3:50:29"}
|
| 845 |
+
{"current_steps": 845, "total_steps": 1195, "loss": 0.2427, "lr": 9.581193190241398e-06, "epoch": 3.526343244653104, "percentage": 70.71, "elapsed_time": "9:14:59", "remaining_time": "3:49:52"}
|
| 846 |
+
{"current_steps": 846, "total_steps": 1195, "loss": 0.2631, "lr": 9.531346742268713e-06, "epoch": 3.5305164319248825, "percentage": 70.79, "elapsed_time": "9:15:46", "remaining_time": "3:49:16"}
|
| 847 |
+
{"current_steps": 847, "total_steps": 1195, "loss": 0.2733, "lr": 9.481589701666682e-06, "epoch": 3.5346896191966612, "percentage": 70.88, "elapsed_time": "9:16:28", "remaining_time": "3:48:38"}
|
| 848 |
+
{"current_steps": 848, "total_steps": 1195, "loss": 0.2582, "lr": 9.431922493384571e-06, "epoch": 3.5388628064684404, "percentage": 70.96, "elapsed_time": "9:17:00", "remaining_time": "3:47:55"}
|
| 849 |
+
{"current_steps": 849, "total_steps": 1195, "loss": 0.2542, "lr": 9.382345541604376e-06, "epoch": 3.543035993740219, "percentage": 71.05, "elapsed_time": "9:17:39", "remaining_time": "3:47:15"}
|
| 850 |
+
{"current_steps": 850, "total_steps": 1195, "loss": 0.2756, "lr": 9.332859269737303e-06, "epoch": 3.547209181011998, "percentage": 71.13, "elapsed_time": "9:18:19", "remaining_time": "3:46:36"}
|
| 851 |
+
{"current_steps": 851, "total_steps": 1195, "loss": 0.2548, "lr": 9.283464100420064e-06, "epoch": 3.5513823682837766, "percentage": 71.21, "elapsed_time": "9:18:59", "remaining_time": "3:45:57"}
|
| 852 |
+
{"current_steps": 852, "total_steps": 1195, "loss": 0.2386, "lr": 9.234160455511365e-06, "epoch": 3.5555555555555554, "percentage": 71.3, "elapsed_time": "9:19:37", "remaining_time": "3:45:17"}
|
| 853 |
+
{"current_steps": 853, "total_steps": 1195, "loss": 0.2479, "lr": 9.184948756088201e-06, "epoch": 3.5597287428273345, "percentage": 71.38, "elapsed_time": "9:20:13", "remaining_time": "3:44:36"}
|
| 854 |
+
{"current_steps": 854, "total_steps": 1195, "loss": 0.2637, "lr": 9.135829422442337e-06, "epoch": 3.5639019300991133, "percentage": 71.46, "elapsed_time": "9:20:55", "remaining_time": "3:43:58"}
|
| 855 |
+
{"current_steps": 855, "total_steps": 1195, "loss": 0.2609, "lr": 9.08680287407667e-06, "epoch": 3.568075117370892, "percentage": 71.55, "elapsed_time": "9:21:38", "remaining_time": "3:43:20"}
|
| 856 |
+
{"current_steps": 856, "total_steps": 1195, "loss": 0.2686, "lr": 9.03786952970168e-06, "epoch": 3.5722483046426707, "percentage": 71.63, "elapsed_time": "9:22:14", "remaining_time": "3:42:39"}
|
| 857 |
+
{"current_steps": 857, "total_steps": 1195, "loss": 0.2547, "lr": 8.989029807231844e-06, "epoch": 3.5764214919144495, "percentage": 71.72, "elapsed_time": "9:22:53", "remaining_time": "3:42:00"}
|
| 858 |
+
{"current_steps": 858, "total_steps": 1195, "loss": 0.2612, "lr": 8.940284123782037e-06, "epoch": 3.5805946791862286, "percentage": 71.8, "elapsed_time": "9:23:37", "remaining_time": "3:41:22"}
|
| 859 |
+
{"current_steps": 859, "total_steps": 1195, "loss": 0.2594, "lr": 8.891632895664027e-06, "epoch": 3.5847678664580074, "percentage": 71.88, "elapsed_time": "9:24:13", "remaining_time": "3:40:41"}
|
| 860 |
+
{"current_steps": 860, "total_steps": 1195, "loss": 0.2572, "lr": 8.843076538382853e-06, "epoch": 3.588941053729786, "percentage": 71.97, "elapsed_time": "9:24:51", "remaining_time": "3:40:01"}
|
| 861 |
+
{"current_steps": 861, "total_steps": 1195, "loss": 0.2554, "lr": 8.794615466633356e-06, "epoch": 3.593114241001565, "percentage": 72.05, "elapsed_time": "9:25:34", "remaining_time": "3:39:23"}
|
| 862 |
+
{"current_steps": 862, "total_steps": 1195, "loss": 0.2375, "lr": 8.74625009429655e-06, "epoch": 3.5972874282733436, "percentage": 72.13, "elapsed_time": "9:26:09", "remaining_time": "3:38:42"}
|
| 863 |
+
{"current_steps": 863, "total_steps": 1195, "loss": 0.2604, "lr": 8.697980834436159e-06, "epoch": 3.6014606155451228, "percentage": 72.22, "elapsed_time": "9:26:45", "remaining_time": "3:38:02"}
|
| 864 |
+
{"current_steps": 864, "total_steps": 1195, "loss": 0.2704, "lr": 8.649808099295031e-06, "epoch": 3.6056338028169015, "percentage": 72.3, "elapsed_time": "9:27:33", "remaining_time": "3:37:25"}
|
| 865 |
+
{"current_steps": 865, "total_steps": 1195, "loss": 0.2433, "lr": 8.601732300291674e-06, "epoch": 3.6098069900886802, "percentage": 72.38, "elapsed_time": "9:28:07", "remaining_time": "3:36:44"}
|
| 866 |
+
{"current_steps": 866, "total_steps": 1195, "loss": 0.2451, "lr": 8.553753848016702e-06, "epoch": 3.613980177360459, "percentage": 72.47, "elapsed_time": "9:28:48", "remaining_time": "3:36:05"}
|
| 867 |
+
{"current_steps": 867, "total_steps": 1195, "loss": 0.2246, "lr": 8.50587315222935e-06, "epoch": 3.6181533646322377, "percentage": 72.55, "elapsed_time": "9:29:19", "remaining_time": "3:35:23"}
|
| 868 |
+
{"current_steps": 868, "total_steps": 1195, "loss": 0.2573, "lr": 8.458090621853938e-06, "epoch": 3.622326551904017, "percentage": 72.64, "elapsed_time": "9:29:57", "remaining_time": "3:34:42"}
|
| 869 |
+
{"current_steps": 869, "total_steps": 1195, "loss": 0.2472, "lr": 8.410406664976439e-06, "epoch": 3.6264997391757956, "percentage": 72.72, "elapsed_time": "9:30:36", "remaining_time": "3:34:03"}
|
| 870 |
+
{"current_steps": 870, "total_steps": 1195, "loss": 0.2592, "lr": 8.362821688840947e-06, "epoch": 3.6306729264475743, "percentage": 72.8, "elapsed_time": "9:31:19", "remaining_time": "3:33:25"}
|
| 871 |
+
{"current_steps": 871, "total_steps": 1195, "loss": 0.2581, "lr": 8.315336099846202e-06, "epoch": 3.634846113719353, "percentage": 72.89, "elapsed_time": "9:31:58", "remaining_time": "3:32:46"}
|
| 872 |
+
{"current_steps": 872, "total_steps": 1195, "loss": 0.2524, "lr": 8.267950303542155e-06, "epoch": 3.639019300991132, "percentage": 72.97, "elapsed_time": "9:32:37", "remaining_time": "3:32:06"}
|
| 873 |
+
{"current_steps": 873, "total_steps": 1195, "loss": 0.2679, "lr": 8.220664704626442e-06, "epoch": 3.643192488262911, "percentage": 73.05, "elapsed_time": "9:33:19", "remaining_time": "3:31:27"}
|
| 874 |
+
{"current_steps": 874, "total_steps": 1195, "loss": 0.2462, "lr": 8.173479706941014e-06, "epoch": 3.6473656755346897, "percentage": 73.14, "elapsed_time": "9:33:58", "remaining_time": "3:30:48"}
|
| 875 |
+
{"current_steps": 875, "total_steps": 1195, "loss": 0.2282, "lr": 8.12639571346859e-06, "epoch": 3.6515388628064684, "percentage": 73.22, "elapsed_time": "9:34:32", "remaining_time": "3:30:07"}
|
| 876 |
+
{"current_steps": 876, "total_steps": 1195, "loss": 0.2405, "lr": 8.079413126329299e-06, "epoch": 3.655712050078247, "percentage": 73.31, "elapsed_time": "9:35:11", "remaining_time": "3:29:27"}
|
| 877 |
+
{"current_steps": 877, "total_steps": 1195, "loss": 0.241, "lr": 8.032532346777185e-06, "epoch": 3.659885237350026, "percentage": 73.39, "elapsed_time": "9:35:50", "remaining_time": "3:28:47"}
|
| 878 |
+
{"current_steps": 878, "total_steps": 1195, "loss": 0.236, "lr": 7.985753775196822e-06, "epoch": 3.664058424621805, "percentage": 73.47, "elapsed_time": "9:36:24", "remaining_time": "3:28:06"}
|
| 879 |
+
{"current_steps": 879, "total_steps": 1195, "loss": 0.2556, "lr": 7.93907781109988e-06, "epoch": 3.668231611893584, "percentage": 73.56, "elapsed_time": "9:37:04", "remaining_time": "3:27:27"}
|
| 880 |
+
{"current_steps": 880, "total_steps": 1195, "loss": 0.2328, "lr": 7.89250485312171e-06, "epoch": 3.6724047991653626, "percentage": 73.64, "elapsed_time": "9:37:34", "remaining_time": "3:26:44"}
|
| 881 |
+
{"current_steps": 881, "total_steps": 1195, "loss": 0.2706, "lr": 7.846035299017921e-06, "epoch": 3.6765779864371413, "percentage": 73.72, "elapsed_time": "9:38:16", "remaining_time": "3:26:06"}
|
| 882 |
+
{"current_steps": 882, "total_steps": 1195, "loss": 0.2422, "lr": 7.799669545661026e-06, "epoch": 3.68075117370892, "percentage": 73.81, "elapsed_time": "9:39:00", "remaining_time": "3:25:28"}
|
| 883 |
+
{"current_steps": 883, "total_steps": 1195, "loss": 0.2604, "lr": 7.753407989037032e-06, "epoch": 3.684924360980699, "percentage": 73.89, "elapsed_time": "9:39:38", "remaining_time": "3:24:48"}
|
| 884 |
+
{"current_steps": 884, "total_steps": 1195, "loss": 0.2621, "lr": 7.707251024242031e-06, "epoch": 3.689097548252478, "percentage": 73.97, "elapsed_time": "9:40:12", "remaining_time": "3:24:07"}
|
| 885 |
+
{"current_steps": 885, "total_steps": 1195, "loss": 0.2604, "lr": 7.661199045478874e-06, "epoch": 3.6932707355242567, "percentage": 74.06, "elapsed_time": "9:40:51", "remaining_time": "3:23:27"}
|
| 886 |
+
{"current_steps": 886, "total_steps": 1195, "loss": 0.2453, "lr": 7.615252446053761e-06, "epoch": 3.6974439227960354, "percentage": 74.14, "elapsed_time": "9:41:34", "remaining_time": "3:22:49"}
|
| 887 |
+
{"current_steps": 887, "total_steps": 1195, "loss": 0.2424, "lr": 7.569411618372917e-06, "epoch": 3.701617110067814, "percentage": 74.23, "elapsed_time": "9:42:11", "remaining_time": "3:22:09"}
|
| 888 |
+
{"current_steps": 888, "total_steps": 1195, "loss": 0.2477, "lr": 7.523676953939218e-06, "epoch": 3.7057902973395933, "percentage": 74.31, "elapsed_time": "9:42:50", "remaining_time": "3:21:30"}
|
| 889 |
+
{"current_steps": 889, "total_steps": 1195, "loss": 0.2593, "lr": 7.478048843348866e-06, "epoch": 3.709963484611372, "percentage": 74.39, "elapsed_time": "9:43:35", "remaining_time": "3:20:52"}
|
| 890 |
+
{"current_steps": 890, "total_steps": 1195, "loss": 0.2568, "lr": 7.432527676288015e-06, "epoch": 3.7141366718831508, "percentage": 74.48, "elapsed_time": "9:44:06", "remaining_time": "3:20:10"}
|
| 891 |
+
{"current_steps": 891, "total_steps": 1195, "loss": 0.2436, "lr": 7.387113841529494e-06, "epoch": 3.7183098591549295, "percentage": 74.56, "elapsed_time": "9:44:42", "remaining_time": "3:19:29"}
|
| 892 |
+
{"current_steps": 892, "total_steps": 1195, "loss": 0.264, "lr": 7.341807726929453e-06, "epoch": 3.7224830464267082, "percentage": 74.64, "elapsed_time": "9:45:25", "remaining_time": "3:18:51"}
|
| 893 |
+
{"current_steps": 893, "total_steps": 1195, "loss": 0.2779, "lr": 7.296609719424068e-06, "epoch": 3.7266562336984874, "percentage": 74.73, "elapsed_time": "9:46:08", "remaining_time": "3:18:13"}
|
| 894 |
+
{"current_steps": 894, "total_steps": 1195, "loss": 0.2506, "lr": 7.251520205026206e-06, "epoch": 3.730829420970266, "percentage": 74.81, "elapsed_time": "9:46:48", "remaining_time": "3:17:34"}
|
| 895 |
+
{"current_steps": 895, "total_steps": 1195, "loss": 0.2719, "lr": 7.206539568822179e-06, "epoch": 3.735002608242045, "percentage": 74.9, "elapsed_time": "9:47:30", "remaining_time": "3:16:55"}
|
| 896 |
+
{"current_steps": 896, "total_steps": 1195, "loss": 0.2377, "lr": 7.161668194968401e-06, "epoch": 3.7391757955138236, "percentage": 74.98, "elapsed_time": "9:48:08", "remaining_time": "3:16:16"}
|
| 897 |
+
{"current_steps": 897, "total_steps": 1195, "loss": 0.2643, "lr": 7.116906466688147e-06, "epoch": 3.7433489827856024, "percentage": 75.06, "elapsed_time": "9:48:46", "remaining_time": "3:15:36"}
|
| 898 |
+
{"current_steps": 898, "total_steps": 1195, "loss": 0.2326, "lr": 7.072254766268269e-06, "epoch": 3.7475221700573815, "percentage": 75.15, "elapsed_time": "9:49:24", "remaining_time": "3:14:56"}
|
| 899 |
+
{"current_steps": 899, "total_steps": 1195, "loss": 0.2527, "lr": 7.027713475055913e-06, "epoch": 3.7516953573291603, "percentage": 75.23, "elapsed_time": "9:49:59", "remaining_time": "3:14:15"}
|
| 900 |
+
{"current_steps": 900, "total_steps": 1195, "loss": 0.2667, "lr": 6.98328297345529e-06, "epoch": 3.755868544600939, "percentage": 75.31, "elapsed_time": "9:50:35", "remaining_time": "3:13:35"}
|
| 901 |
+
{"current_steps": 901, "total_steps": 1195, "loss": 0.2515, "lr": 6.938963640924405e-06, "epoch": 3.7600417318727177, "percentage": 75.4, "elapsed_time": "9:51:16", "remaining_time": "3:12:56"}
|
| 902 |
+
{"current_steps": 902, "total_steps": 1195, "loss": 0.2591, "lr": 6.894755855971842e-06, "epoch": 3.7642149191444965, "percentage": 75.48, "elapsed_time": "9:51:57", "remaining_time": "3:12:17"}
|
| 903 |
+
{"current_steps": 903, "total_steps": 1195, "loss": 0.2738, "lr": 6.850659996153488e-06, "epoch": 3.7683881064162756, "percentage": 75.56, "elapsed_time": "9:52:45", "remaining_time": "3:11:40"}
|
| 904 |
+
{"current_steps": 904, "total_steps": 1195, "loss": 0.2346, "lr": 6.806676438069359e-06, "epoch": 3.7725612936880544, "percentage": 75.65, "elapsed_time": "9:53:27", "remaining_time": "3:11:02"}
|
| 905 |
+
{"current_steps": 905, "total_steps": 1195, "loss": 0.2622, "lr": 6.762805557360335e-06, "epoch": 3.776734480959833, "percentage": 75.73, "elapsed_time": "9:54:04", "remaining_time": "3:10:21"}
|
| 906 |
+
{"current_steps": 906, "total_steps": 1195, "loss": 0.2434, "lr": 6.7190477287050125e-06, "epoch": 3.780907668231612, "percentage": 75.82, "elapsed_time": "9:54:44", "remaining_time": "3:09:42"}
|
| 907 |
+
{"current_steps": 907, "total_steps": 1195, "loss": 0.244, "lr": 6.6754033258164345e-06, "epoch": 3.7850808555033906, "percentage": 75.9, "elapsed_time": "9:55:20", "remaining_time": "3:09:02"}
|
| 908 |
+
{"current_steps": 908, "total_steps": 1195, "loss": 0.2531, "lr": 6.631872721438957e-06, "epoch": 3.7892540427751698, "percentage": 75.98, "elapsed_time": "9:55:58", "remaining_time": "3:08:22"}
|
| 909 |
+
{"current_steps": 909, "total_steps": 1195, "loss": 0.2804, "lr": 6.588456287345015e-06, "epoch": 3.7934272300469485, "percentage": 76.07, "elapsed_time": "9:56:41", "remaining_time": "3:07:44"}
|
| 910 |
+
{"current_steps": 910, "total_steps": 1195, "loss": 0.2423, "lr": 6.5451543943320005e-06, "epoch": 3.797600417318727, "percentage": 76.15, "elapsed_time": "9:57:12", "remaining_time": "3:07:02"}
|
| 911 |
+
{"current_steps": 911, "total_steps": 1195, "loss": 0.2729, "lr": 6.501967412219065e-06, "epoch": 3.801773604590506, "percentage": 76.23, "elapsed_time": "9:57:50", "remaining_time": "3:06:22"}
|
| 912 |
+
{"current_steps": 912, "total_steps": 1195, "loss": 0.2628, "lr": 6.458895709843946e-06, "epoch": 3.8059467918622847, "percentage": 76.32, "elapsed_time": "9:58:33", "remaining_time": "3:05:44"}
|
| 913 |
+
{"current_steps": 913, "total_steps": 1195, "loss": 0.238, "lr": 6.415939655059853e-06, "epoch": 3.810119979134064, "percentage": 76.4, "elapsed_time": "9:59:07", "remaining_time": "3:05:03"}
|
| 914 |
+
{"current_steps": 914, "total_steps": 1195, "loss": 0.2551, "lr": 6.373099614732308e-06, "epoch": 3.8142931664058426, "percentage": 76.49, "elapsed_time": "9:59:41", "remaining_time": "3:04:22"}
|
| 915 |
+
{"current_steps": 915, "total_steps": 1195, "loss": 0.2469, "lr": 6.330375954736014e-06, "epoch": 3.8184663536776213, "percentage": 76.57, "elapsed_time": "10:00:24", "remaining_time": "3:03:43"}
|
| 916 |
+
{"current_steps": 916, "total_steps": 1195, "loss": 0.2589, "lr": 6.287769039951716e-06, "epoch": 3.8226395409494, "percentage": 76.65, "elapsed_time": "10:01:13", "remaining_time": "3:03:07"}
|
| 917 |
+
{"current_steps": 917, "total_steps": 1195, "loss": 0.2623, "lr": 6.2452792342631215e-06, "epoch": 3.826812728221179, "percentage": 76.74, "elapsed_time": "10:01:54", "remaining_time": "3:02:28"}
|
| 918 |
+
{"current_steps": 918, "total_steps": 1195, "loss": 0.2589, "lr": 6.202906900553734e-06, "epoch": 3.830985915492958, "percentage": 76.82, "elapsed_time": "10:02:34", "remaining_time": "3:01:49"}
|
| 919 |
+
{"current_steps": 919, "total_steps": 1195, "loss": 0.2403, "lr": 6.1606524007038415e-06, "epoch": 3.8351591027647367, "percentage": 76.9, "elapsed_time": "10:03:13", "remaining_time": "3:01:09"}
|
| 920 |
+
{"current_steps": 920, "total_steps": 1195, "loss": 0.2481, "lr": 6.118516095587321e-06, "epoch": 3.8393322900365154, "percentage": 76.99, "elapsed_time": "10:03:52", "remaining_time": "3:00:30"}
|
| 921 |
+
{"current_steps": 921, "total_steps": 1195, "loss": 0.2509, "lr": 6.076498345068651e-06, "epoch": 3.843505477308294, "percentage": 77.07, "elapsed_time": "10:04:27", "remaining_time": "2:59:49"}
|
| 922 |
+
{"current_steps": 922, "total_steps": 1195, "loss": 0.2528, "lr": 6.034599507999759e-06, "epoch": 3.847678664580073, "percentage": 77.15, "elapsed_time": "10:05:02", "remaining_time": "2:59:09"}
|
| 923 |
+
{"current_steps": 923, "total_steps": 1195, "loss": 0.2412, "lr": 5.992819942217021e-06, "epoch": 3.851851851851852, "percentage": 77.24, "elapsed_time": "10:05:40", "remaining_time": "2:58:29"}
|
| 924 |
+
{"current_steps": 924, "total_steps": 1195, "loss": 0.2657, "lr": 5.951160004538177e-06, "epoch": 3.856025039123631, "percentage": 77.32, "elapsed_time": "10:06:14", "remaining_time": "2:57:48"}
|
| 925 |
+
{"current_steps": 925, "total_steps": 1195, "loss": 0.2477, "lr": 5.909620050759266e-06, "epoch": 3.8601982263954095, "percentage": 77.41, "elapsed_time": "10:06:54", "remaining_time": "2:57:09"}
|
| 926 |
+
{"current_steps": 926, "total_steps": 1195, "loss": 0.2494, "lr": 5.86820043565163e-06, "epoch": 3.8643714136671883, "percentage": 77.49, "elapsed_time": "10:07:35", "remaining_time": "2:56:30"}
|
| 927 |
+
{"current_steps": 927, "total_steps": 1195, "loss": 0.2543, "lr": 5.826901512958829e-06, "epoch": 3.868544600938967, "percentage": 77.57, "elapsed_time": "10:08:16", "remaining_time": "2:55:51"}
|
| 928 |
+
{"current_steps": 928, "total_steps": 1195, "loss": 0.2504, "lr": 5.785723635393701e-06, "epoch": 3.872717788210746, "percentage": 77.66, "elapsed_time": "10:08:54", "remaining_time": "2:55:11"}
|
| 929 |
+
{"current_steps": 929, "total_steps": 1195, "loss": 0.256, "lr": 5.744667154635246e-06, "epoch": 3.876890975482525, "percentage": 77.74, "elapsed_time": "10:09:35", "remaining_time": "2:54:32"}
|
| 930 |
+
{"current_steps": 930, "total_steps": 1195, "loss": 0.2174, "lr": 5.703732421325716e-06, "epoch": 3.8810641627543037, "percentage": 77.82, "elapsed_time": "10:10:10", "remaining_time": "2:53:52"}
|
| 931 |
+
{"current_steps": 931, "total_steps": 1195, "loss": 0.2645, "lr": 5.662919785067549e-06, "epoch": 3.8852373500260824, "percentage": 77.91, "elapsed_time": "10:10:53", "remaining_time": "2:53:13"}
|
| 932 |
+
{"current_steps": 932, "total_steps": 1195, "loss": 0.2682, "lr": 5.62222959442045e-06, "epoch": 3.889410537297861, "percentage": 77.99, "elapsed_time": "10:11:34", "remaining_time": "2:52:34"}
|
| 933 |
+
{"current_steps": 933, "total_steps": 1195, "loss": 0.2516, "lr": 5.581662196898348e-06, "epoch": 3.8935837245696403, "percentage": 78.08, "elapsed_time": "10:12:12", "remaining_time": "2:51:55"}
|
| 934 |
+
{"current_steps": 934, "total_steps": 1195, "loss": 0.2531, "lr": 5.541217938966483e-06, "epoch": 3.897756911841419, "percentage": 78.16, "elapsed_time": "10:12:51", "remaining_time": "2:51:15"}
|
| 935 |
+
{"current_steps": 935, "total_steps": 1195, "loss": 0.2591, "lr": 5.500897166038397e-06, "epoch": 3.9019300991131978, "percentage": 78.24, "elapsed_time": "10:13:29", "remaining_time": "2:50:35"}
|
| 936 |
+
{"current_steps": 936, "total_steps": 1195, "loss": 0.2395, "lr": 5.460700222473034e-06, "epoch": 3.9061032863849765, "percentage": 78.33, "elapsed_time": "10:14:05", "remaining_time": "2:49:55"}
|
| 937 |
+
{"current_steps": 937, "total_steps": 1195, "loss": 0.2309, "lr": 5.4206274515717735e-06, "epoch": 3.9102764736567552, "percentage": 78.41, "elapsed_time": "10:14:40", "remaining_time": "2:49:15"}
|
| 938 |
+
{"current_steps": 938, "total_steps": 1195, "loss": 0.2461, "lr": 5.38067919557548e-06, "epoch": 3.9144496609285344, "percentage": 78.49, "elapsed_time": "10:15:18", "remaining_time": "2:48:35"}
|
| 939 |
+
{"current_steps": 939, "total_steps": 1195, "loss": 0.2552, "lr": 5.340855795661626e-06, "epoch": 3.918622848200313, "percentage": 78.58, "elapsed_time": "10:15:58", "remaining_time": "2:47:56"}
|
| 940 |
+
{"current_steps": 940, "total_steps": 1195, "loss": 0.2478, "lr": 5.3011575919413214e-06, "epoch": 3.922796035472092, "percentage": 78.66, "elapsed_time": "10:16:39", "remaining_time": "2:47:17"}
|
| 941 |
+
{"current_steps": 941, "total_steps": 1195, "loss": 0.2457, "lr": 5.261584923456484e-06, "epoch": 3.9269692227438706, "percentage": 78.74, "elapsed_time": "10:17:22", "remaining_time": "2:46:38"}
|
| 942 |
+
{"current_steps": 942, "total_steps": 1195, "loss": 0.2309, "lr": 5.222138128176857e-06, "epoch": 3.9311424100156493, "percentage": 78.83, "elapsed_time": "10:17:55", "remaining_time": "2:45:57"}
|
| 943 |
+
{"current_steps": 943, "total_steps": 1195, "loss": 0.247, "lr": 5.182817542997196e-06, "epoch": 3.9353155972874285, "percentage": 78.91, "elapsed_time": "10:18:35", "remaining_time": "2:45:18"}
|
| 944 |
+
{"current_steps": 944, "total_steps": 1195, "loss": 0.2442, "lr": 5.143623503734334e-06, "epoch": 3.9394887845592073, "percentage": 79.0, "elapsed_time": "10:19:18", "remaining_time": "2:44:40"}
|
| 945 |
+
{"current_steps": 945, "total_steps": 1195, "loss": 0.2593, "lr": 5.104556345124363e-06, "epoch": 3.943661971830986, "percentage": 79.08, "elapsed_time": "10:19:54", "remaining_time": "2:43:59"}
|
| 946 |
+
{"current_steps": 946, "total_steps": 1195, "loss": 0.2511, "lr": 5.065616400819746e-06, "epoch": 3.9478351591027647, "percentage": 79.16, "elapsed_time": "10:20:29", "remaining_time": "2:43:19"}
|
| 947 |
+
{"current_steps": 947, "total_steps": 1195, "loss": 0.2735, "lr": 5.026804003386476e-06, "epoch": 3.9520083463745435, "percentage": 79.25, "elapsed_time": "10:21:13", "remaining_time": "2:42:41"}
|
| 948 |
+
{"current_steps": 948, "total_steps": 1195, "loss": 0.2687, "lr": 4.988119484301219e-06, "epoch": 3.9561815336463226, "percentage": 79.33, "elapsed_time": "10:21:56", "remaining_time": "2:42:02"}
|
| 949 |
+
{"current_steps": 949, "total_steps": 1195, "loss": 0.26, "lr": 4.949563173948517e-06, "epoch": 3.960354720918101, "percentage": 79.41, "elapsed_time": "10:22:34", "remaining_time": "2:41:23"}
|
| 950 |
+
{"current_steps": 950, "total_steps": 1195, "loss": 0.2533, "lr": 4.911135401617948e-06, "epoch": 3.96452790818988, "percentage": 79.5, "elapsed_time": "10:23:20", "remaining_time": "2:40:45"}
|
| 951 |
+
{"current_steps": 951, "total_steps": 1195, "loss": 0.2723, "lr": 4.872836495501292e-06, "epoch": 3.968701095461659, "percentage": 79.58, "elapsed_time": "10:24:00", "remaining_time": "2:40:06"}
|
| 952 |
+
{"current_steps": 952, "total_steps": 1195, "loss": 0.2857, "lr": 4.83466678268977e-06, "epoch": 3.9728742827334376, "percentage": 79.67, "elapsed_time": "10:24:40", "remaining_time": "2:39:27"}
|
| 953 |
+
{"current_steps": 953, "total_steps": 1195, "loss": 0.258, "lr": 4.796626589171211e-06, "epoch": 3.9770474700052167, "percentage": 79.75, "elapsed_time": "10:25:18", "remaining_time": "2:38:47"}
|
| 954 |
+
{"current_steps": 954, "total_steps": 1195, "loss": 0.2505, "lr": 4.7587162398273166e-06, "epoch": 3.981220657276995, "percentage": 79.83, "elapsed_time": "10:25:57", "remaining_time": "2:38:07"}
|
| 955 |
+
{"current_steps": 955, "total_steps": 1195, "loss": 0.2497, "lr": 4.720936058430818e-06, "epoch": 3.985393844548774, "percentage": 79.92, "elapsed_time": "10:26:42", "remaining_time": "2:37:29"}
|
| 956 |
+
{"current_steps": 956, "total_steps": 1195, "loss": 0.2362, "lr": 4.683286367642785e-06, "epoch": 3.989567031820553, "percentage": 80.0, "elapsed_time": "10:27:24", "remaining_time": "2:36:51"}
|
| 957 |
+
{"current_steps": 957, "total_steps": 1195, "loss": 0.2548, "lr": 4.6457674890098025e-06, "epoch": 3.9937402190923317, "percentage": 80.08, "elapsed_time": "10:28:03", "remaining_time": "2:36:11"}
|
| 958 |
+
{"current_steps": 958, "total_steps": 1195, "loss": 0.238, "lr": 4.6083797429612776e-06, "epoch": 3.997913406364111, "percentage": 80.17, "elapsed_time": "10:28:37", "remaining_time": "2:35:30"}
|
| 959 |
+
{"current_steps": 959, "total_steps": 1195, "loss": 0.2326, "lr": 4.571123448806673e-06, "epoch": 4.002086593635889, "percentage": 80.25, "elapsed_time": "10:30:07", "remaining_time": "2:35:04"}
|
| 960 |
+
{"current_steps": 960, "total_steps": 1195, "loss": 0.1978, "lr": 4.533998924732801e-06, "epoch": 4.006259780907668, "percentage": 80.33, "elapsed_time": "10:30:43", "remaining_time": "2:34:23"}
|
| 961 |
+
{"current_steps": 961, "total_steps": 1195, "loss": 0.1847, "lr": 4.497006487801065e-06, "epoch": 4.010432968179447, "percentage": 80.42, "elapsed_time": "10:31:19", "remaining_time": "2:33:43"}
|