File size: 27,947 Bytes
f4d3a47
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
{"current_steps": 5, "total_steps": 690, "loss": 1.3988, "lr": 5.7142857142857145e-06, "epoch": 0.01451378809869376, "percentage": 0.72, "elapsed_time": "0:00:19", "remaining_time": "0:44:25"}
{"current_steps": 10, "total_steps": 690, "loss": 1.395, "lr": 1.2857142857142857e-05, "epoch": 0.02902757619738752, "percentage": 1.45, "elapsed_time": "0:00:35", "remaining_time": "0:39:59"}
{"current_steps": 15, "total_steps": 690, "loss": 1.2558, "lr": 2e-05, "epoch": 0.04354136429608128, "percentage": 2.17, "elapsed_time": "0:00:56", "remaining_time": "0:42:02"}
{"current_steps": 20, "total_steps": 690, "loss": 1.1799, "lr": 2.714285714285714e-05, "epoch": 0.05805515239477504, "percentage": 2.9, "elapsed_time": "0:01:13", "remaining_time": "0:40:58"}
{"current_steps": 25, "total_steps": 690, "loss": 1.0813, "lr": 3.428571428571429e-05, "epoch": 0.07256894049346879, "percentage": 3.62, "elapsed_time": "0:01:31", "remaining_time": "0:40:42"}
{"current_steps": 30, "total_steps": 690, "loss": 0.9022, "lr": 4.1428571428571437e-05, "epoch": 0.08708272859216255, "percentage": 4.35, "elapsed_time": "0:02:00", "remaining_time": "0:44:07"}
{"current_steps": 35, "total_steps": 690, "loss": 0.9365, "lr": 4.8571428571428576e-05, "epoch": 0.10159651669085631, "percentage": 5.07, "elapsed_time": "0:02:25", "remaining_time": "0:45:22"}
{"current_steps": 40, "total_steps": 690, "loss": 0.993, "lr": 4.999539919507037e-05, "epoch": 0.11611030478955008, "percentage": 5.8, "elapsed_time": "0:02:40", "remaining_time": "0:43:24"}
{"current_steps": 45, "total_steps": 690, "loss": 0.9726, "lr": 4.997671132725569e-05, "epoch": 0.13062409288824384, "percentage": 6.52, "elapsed_time": "0:02:56", "remaining_time": "0:42:14"}
{"current_steps": 50, "total_steps": 690, "loss": 0.8953, "lr": 4.994365958519782e-05, "epoch": 0.14513788098693758, "percentage": 7.25, "elapsed_time": "0:03:09", "remaining_time": "0:40:29"}
{"current_steps": 55, "total_steps": 690, "loss": 0.9511, "lr": 4.989626297664602e-05, "epoch": 0.15965166908563136, "percentage": 7.97, "elapsed_time": "0:03:25", "remaining_time": "0:39:28"}
{"current_steps": 60, "total_steps": 690, "loss": 0.8398, "lr": 4.983454875894878e-05, "epoch": 0.1741654571843251, "percentage": 8.7, "elapsed_time": "0:03:43", "remaining_time": "0:39:05"}
{"current_steps": 65, "total_steps": 690, "loss": 0.9117, "lr": 4.975855242337838e-05, "epoch": 0.18867924528301888, "percentage": 9.42, "elapsed_time": "0:03:57", "remaining_time": "0:38:05"}
{"current_steps": 70, "total_steps": 690, "loss": 0.8948, "lr": 4.966831767472015e-05, "epoch": 0.20319303338171263, "percentage": 10.14, "elapsed_time": "0:04:14", "remaining_time": "0:37:34"}
{"current_steps": 75, "total_steps": 690, "loss": 0.8303, "lr": 4.956389640613828e-05, "epoch": 0.21770682148040638, "percentage": 10.87, "elapsed_time": "0:04:31", "remaining_time": "0:37:04"}
{"current_steps": 80, "total_steps": 690, "loss": 0.8798, "lr": 4.944534866933257e-05, "epoch": 0.23222060957910015, "percentage": 11.59, "elapsed_time": "0:04:47", "remaining_time": "0:36:31"}
{"current_steps": 85, "total_steps": 690, "loss": 0.8788, "lr": 4.9312742640003216e-05, "epoch": 0.2467343976777939, "percentage": 12.32, "elapsed_time": "0:05:04", "remaining_time": "0:36:06"}
{"current_steps": 90, "total_steps": 690, "loss": 0.8605, "lr": 4.9166154578643596e-05, "epoch": 0.2612481857764877, "percentage": 13.04, "elapsed_time": "0:05:22", "remaining_time": "0:35:52"}
{"current_steps": 95, "total_steps": 690, "loss": 0.8254, "lr": 4.900566878668362e-05, "epoch": 0.2757619738751814, "percentage": 13.77, "elapsed_time": "0:05:38", "remaining_time": "0:35:21"}
{"current_steps": 100, "total_steps": 690, "loss": 0.8569, "lr": 4.883137755800871e-05, "epoch": 0.29027576197387517, "percentage": 14.49, "elapsed_time": "0:05:53", "remaining_time": "0:34:48"}
{"current_steps": 100, "total_steps": 690, "eval_loss": 0.8779192566871643, "epoch": 0.29027576197387517, "percentage": 14.49, "elapsed_time": "0:06:13", "remaining_time": "0:36:43"}
{"current_steps": 105, "total_steps": 690, "loss": 0.8342, "lr": 4.864338112588245e-05, "epoch": 0.3047895500725689, "percentage": 15.22, "elapsed_time": "0:06:28", "remaining_time": "0:36:02"}
{"current_steps": 110, "total_steps": 690, "loss": 0.8117, "lr": 4.8441787605303424e-05, "epoch": 0.3193033381712627, "percentage": 15.94, "elapsed_time": "0:06:44", "remaining_time": "0:35:34"}
{"current_steps": 115, "total_steps": 690, "loss": 0.8199, "lr": 4.822671293082922e-05, "epoch": 0.33381712626995647, "percentage": 16.67, "elapsed_time": "0:07:03", "remaining_time": "0:35:17"}
{"current_steps": 120, "total_steps": 690, "loss": 0.9149, "lr": 4.799828078990357e-05, "epoch": 0.3483309143686502, "percentage": 17.39, "elapsed_time": "0:07:15", "remaining_time": "0:34:26"}
{"current_steps": 125, "total_steps": 690, "loss": 0.813, "lr": 4.775662255172486e-05, "epoch": 0.36284470246734396, "percentage": 18.12, "elapsed_time": "0:07:32", "remaining_time": "0:34:05"}
{"current_steps": 130, "total_steps": 690, "loss": 0.804, "lr": 4.750187719169692e-05, "epoch": 0.37735849056603776, "percentage": 18.84, "elapsed_time": "0:07:48", "remaining_time": "0:33:39"}
{"current_steps": 135, "total_steps": 690, "loss": 0.7661, "lr": 4.723419121150556e-05, "epoch": 0.3918722786647315, "percentage": 19.57, "elapsed_time": "0:08:10", "remaining_time": "0:33:34"}
{"current_steps": 140, "total_steps": 690, "loss": 0.8241, "lr": 4.6953718554866835e-05, "epoch": 0.40638606676342526, "percentage": 20.29, "elapsed_time": "0:08:27", "remaining_time": "0:33:12"}
{"current_steps": 145, "total_steps": 690, "loss": 0.8277, "lr": 4.666062051899538e-05, "epoch": 0.420899854862119, "percentage": 21.01, "elapsed_time": "0:08:41", "remaining_time": "0:32:38"}
{"current_steps": 150, "total_steps": 690, "loss": 0.8293, "lr": 4.635506566184399e-05, "epoch": 0.43541364296081275, "percentage": 21.74, "elapsed_time": "0:08:55", "remaining_time": "0:32:07"}
{"current_steps": 155, "total_steps": 690, "loss": 0.7338, "lr": 4.603722970516741e-05, "epoch": 0.44992743105950656, "percentage": 22.46, "elapsed_time": "0:09:13", "remaining_time": "0:31:51"}
{"current_steps": 160, "total_steps": 690, "loss": 0.8061, "lr": 4.570729543346645e-05, "epoch": 0.4644412191582003, "percentage": 23.19, "elapsed_time": "0:09:29", "remaining_time": "0:31:25"}
{"current_steps": 165, "total_steps": 690, "loss": 0.8342, "lr": 4.536545258887028e-05, "epoch": 0.47895500725689405, "percentage": 23.91, "elapsed_time": "0:09:49", "remaining_time": "0:31:14"}
{"current_steps": 170, "total_steps": 690, "loss": 0.7869, "lr": 4.501189776201755e-05, "epoch": 0.4934687953555878, "percentage": 24.64, "elapsed_time": "0:10:07", "remaining_time": "0:30:56"}
{"current_steps": 175, "total_steps": 690, "loss": 0.7554, "lr": 4.4646834278998884e-05, "epoch": 0.5079825834542816, "percentage": 25.36, "elapsed_time": "0:10:23", "remaining_time": "0:30:34"}
{"current_steps": 180, "total_steps": 690, "loss": 0.7258, "lr": 4.427047208442596e-05, "epoch": 0.5224963715529753, "percentage": 26.09, "elapsed_time": "0:10:43", "remaining_time": "0:30:22"}
{"current_steps": 185, "total_steps": 690, "loss": 0.8281, "lr": 4.388302762069435e-05, "epoch": 0.5370101596516691, "percentage": 26.81, "elapsed_time": "0:10:59", "remaining_time": "0:30:00"}
{"current_steps": 190, "total_steps": 690, "loss": 0.7811, "lr": 4.348472370350946e-05, "epoch": 0.5515239477503628, "percentage": 27.54, "elapsed_time": "0:11:16", "remaining_time": "0:29:39"}
{"current_steps": 195, "total_steps": 690, "loss": 0.8315, "lr": 4.3075789393747306e-05, "epoch": 0.5660377358490566, "percentage": 28.26, "elapsed_time": "0:11:29", "remaining_time": "0:29:09"}
{"current_steps": 200, "total_steps": 690, "loss": 0.8435, "lr": 4.2656459865723775e-05, "epoch": 0.5805515239477503, "percentage": 28.99, "elapsed_time": "0:11:43", "remaining_time": "0:28:42"}
{"current_steps": 200, "total_steps": 690, "eval_loss": 0.8247659802436829, "epoch": 0.5805515239477503, "percentage": 28.99, "elapsed_time": "0:12:02", "remaining_time": "0:29:30"}
{"current_steps": 205, "total_steps": 690, "loss": 0.7336, "lr": 4.222697627194803e-05, "epoch": 0.5950653120464441, "percentage": 29.71, "elapsed_time": "0:12:23", "remaining_time": "0:29:18"}
{"current_steps": 210, "total_steps": 690, "loss": 0.7715, "lr": 4.1787585604437926e-05, "epoch": 0.6095791001451378, "percentage": 30.43, "elapsed_time": "0:12:39", "remaining_time": "0:28:55"}
{"current_steps": 215, "total_steps": 690, "loss": 0.725, "lr": 4.133854055267725e-05, "epoch": 0.6240928882438317, "percentage": 31.16, "elapsed_time": "0:12:59", "remaining_time": "0:28:41"}
{"current_steps": 220, "total_steps": 690, "loss": 0.7568, "lr": 4.088009935829631e-05, "epoch": 0.6386066763425254, "percentage": 31.88, "elapsed_time": "0:13:18", "remaining_time": "0:28:26"}
{"current_steps": 225, "total_steps": 690, "loss": 0.8035, "lr": 4.0412525666559596e-05, "epoch": 0.6531204644412192, "percentage": 32.61, "elapsed_time": "0:13:31", "remaining_time": "0:27:57"}
{"current_steps": 230, "total_steps": 690, "loss": 0.7497, "lr": 3.993608837474585e-05, "epoch": 0.6676342525399129, "percentage": 33.33, "elapsed_time": "0:13:49", "remaining_time": "0:27:39"}
{"current_steps": 235, "total_steps": 690, "loss": 0.752, "lr": 3.9451061477507715e-05, "epoch": 0.6821480406386067, "percentage": 34.06, "elapsed_time": "0:14:08", "remaining_time": "0:27:23"}
{"current_steps": 240, "total_steps": 690, "loss": 0.7866, "lr": 3.895772390929996e-05, "epoch": 0.6966618287373004, "percentage": 34.78, "elapsed_time": "0:14:26", "remaining_time": "0:27:03"}
{"current_steps": 245, "total_steps": 690, "loss": 0.8149, "lr": 3.8456359383966934e-05, "epoch": 0.7111756168359942, "percentage": 35.51, "elapsed_time": "0:14:39", "remaining_time": "0:26:37"}
{"current_steps": 250, "total_steps": 690, "loss": 0.8159, "lr": 3.7947256231581296e-05, "epoch": 0.7256894049346879, "percentage": 36.23, "elapsed_time": "0:14:52", "remaining_time": "0:26:10"}
{"current_steps": 255, "total_steps": 690, "loss": 0.809, "lr": 3.743070723262809e-05, "epoch": 0.7402031930333817, "percentage": 36.96, "elapsed_time": "0:15:05", "remaining_time": "0:25:45"}
{"current_steps": 260, "total_steps": 690, "loss": 0.7652, "lr": 3.690700944962947e-05, "epoch": 0.7547169811320755, "percentage": 37.68, "elapsed_time": "0:15:20", "remaining_time": "0:25:22"}
{"current_steps": 265, "total_steps": 690, "loss": 0.7275, "lr": 3.637646405630673e-05, "epoch": 0.7692307692307693, "percentage": 38.41, "elapsed_time": "0:15:39", "remaining_time": "0:25:07"}
{"current_steps": 270, "total_steps": 690, "loss": 0.7794, "lr": 3.583937616437816e-05, "epoch": 0.783744557329463, "percentage": 39.13, "elapsed_time": "0:15:54", "remaining_time": "0:24:44"}
{"current_steps": 275, "total_steps": 690, "loss": 0.7496, "lr": 3.529605464809208e-05, "epoch": 0.7982583454281568, "percentage": 39.86, "elapsed_time": "0:16:13", "remaining_time": "0:24:28"}
{"current_steps": 280, "total_steps": 690, "loss": 0.7894, "lr": 3.4746811966596196e-05, "epoch": 0.8127721335268505, "percentage": 40.58, "elapsed_time": "0:16:30", "remaining_time": "0:24:09"}
{"current_steps": 285, "total_steps": 690, "loss": 0.7222, "lr": 3.419196398424521e-05, "epoch": 0.8272859216255443, "percentage": 41.3, "elapsed_time": "0:16:49", "remaining_time": "0:23:54"}
{"current_steps": 290, "total_steps": 690, "loss": 0.7631, "lr": 3.363182978895019e-05, "epoch": 0.841799709724238, "percentage": 42.03, "elapsed_time": "0:17:07", "remaining_time": "0:23:36"}
{"current_steps": 295, "total_steps": 690, "loss": 0.7486, "lr": 3.306673150867407e-05, "epoch": 0.8563134978229318, "percentage": 42.75, "elapsed_time": "0:17:24", "remaining_time": "0:23:18"}
{"current_steps": 300, "total_steps": 690, "loss": 0.7267, "lr": 3.249699412617883e-05, "epoch": 0.8708272859216255, "percentage": 43.48, "elapsed_time": "0:17:46", "remaining_time": "0:23:07"}
{"current_steps": 300, "total_steps": 690, "eval_loss": 0.8032158613204956, "epoch": 0.8708272859216255, "percentage": 43.48, "elapsed_time": "0:18:06", "remaining_time": "0:23:32"}
{"current_steps": 305, "total_steps": 690, "loss": 0.7453, "lr": 3.1922945292131006e-05, "epoch": 0.8853410740203193, "percentage": 44.2, "elapsed_time": "0:18:25", "remaining_time": "0:23:15"}
{"current_steps": 310, "total_steps": 690, "loss": 0.7828, "lr": 3.1344915136672784e-05, "epoch": 0.8998548621190131, "percentage": 44.93, "elapsed_time": "0:18:39", "remaining_time": "0:22:51"}
{"current_steps": 315, "total_steps": 690, "loss": 0.7636, "lr": 3.076323607956723e-05, "epoch": 0.9143686502177069, "percentage": 45.65, "elapsed_time": "0:18:55", "remaining_time": "0:22:31"}
{"current_steps": 320, "total_steps": 690, "loss": 0.7274, "lr": 3.0178242639026792e-05, "epoch": 0.9288824383164006, "percentage": 46.38, "elapsed_time": "0:19:17", "remaining_time": "0:22:18"}
{"current_steps": 325, "total_steps": 690, "loss": 0.7282, "lr": 2.959027123933501e-05, "epoch": 0.9433962264150944, "percentage": 47.1, "elapsed_time": "0:19:35", "remaining_time": "0:22:00"}
{"current_steps": 330, "total_steps": 690, "loss": 0.7825, "lr": 2.899966001737199e-05, "epoch": 0.9579100145137881, "percentage": 47.83, "elapsed_time": "0:19:53", "remaining_time": "0:21:41"}
{"current_steps": 335, "total_steps": 690, "loss": 0.7657, "lr": 2.840674862815506e-05, "epoch": 0.9724238026124818, "percentage": 48.55, "elapsed_time": "0:20:08", "remaining_time": "0:21:20"}
{"current_steps": 340, "total_steps": 690, "loss": 0.7861, "lr": 2.7811878049506362e-05, "epoch": 0.9869375907111756, "percentage": 49.28, "elapsed_time": "0:20:24", "remaining_time": "0:21:00"}
{"current_steps": 345, "total_steps": 690, "loss": 0.7343, "lr": 2.7215390385959598e-05, "epoch": 1.0, "percentage": 50.0, "elapsed_time": "0:20:42", "remaining_time": "0:20:42"}
{"current_steps": 350, "total_steps": 690, "loss": 0.665, "lr": 2.6617628672018997e-05, "epoch": 1.0145137880986939, "percentage": 50.72, "elapsed_time": "0:21:03", "remaining_time": "0:20:26"}
{"current_steps": 355, "total_steps": 690, "loss": 0.6674, "lr": 2.6018936674883277e-05, "epoch": 1.0290275761973875, "percentage": 51.45, "elapsed_time": "0:21:23", "remaining_time": "0:20:10"}
{"current_steps": 360, "total_steps": 690, "loss": 0.7013, "lr": 2.541965869674838e-05, "epoch": 1.0435413642960814, "percentage": 52.17, "elapsed_time": "0:21:42", "remaining_time": "0:19:54"}
{"current_steps": 365, "total_steps": 690, "loss": 0.6625, "lr": 2.482013937680245e-05, "epoch": 1.058055152394775, "percentage": 52.9, "elapsed_time": "0:22:02", "remaining_time": "0:19:37"}
{"current_steps": 370, "total_steps": 690, "loss": 0.6697, "lr": 2.4220723493027087e-05, "epoch": 1.0725689404934688, "percentage": 53.62, "elapsed_time": "0:22:27", "remaining_time": "0:19:25"}
{"current_steps": 375, "total_steps": 690, "loss": 0.7241, "lr": 2.3621755763918688e-05, "epoch": 1.0870827285921625, "percentage": 54.35, "elapsed_time": "0:22:43", "remaining_time": "0:19:05"}
{"current_steps": 380, "total_steps": 690, "loss": 0.6989, "lr": 2.302358065024409e-05, "epoch": 1.1015965166908563, "percentage": 55.07, "elapsed_time": "0:23:01", "remaining_time": "0:18:46"}
{"current_steps": 385, "total_steps": 690, "loss": 0.6757, "lr": 2.242654215694435e-05, "epoch": 1.11611030478955, "percentage": 55.8, "elapsed_time": "0:23:20", "remaining_time": "0:18:29"}
{"current_steps": 390, "total_steps": 690, "loss": 0.7151, "lr": 2.183098363530076e-05, "epoch": 1.1306240928882438, "percentage": 56.52, "elapsed_time": "0:23:38", "remaining_time": "0:18:10"}
{"current_steps": 395, "total_steps": 690, "loss": 0.7134, "lr": 2.123724758547664e-05, "epoch": 1.1451378809869377, "percentage": 57.25, "elapsed_time": "0:23:52", "remaining_time": "0:17:50"}
{"current_steps": 400, "total_steps": 690, "loss": 0.7409, "lr": 2.0645675459548757e-05, "epoch": 1.1596516690856313, "percentage": 57.97, "elapsed_time": "0:24:08", "remaining_time": "0:17:30"}
{"current_steps": 400, "total_steps": 690, "eval_loss": 0.7901310324668884, "epoch": 1.1596516690856313, "percentage": 57.97, "elapsed_time": "0:24:28", "remaining_time": "0:17:44"}
{"current_steps": 405, "total_steps": 690, "loss": 0.7311, "lr": 2.005660746514138e-05, "epoch": 1.1741654571843252, "percentage": 58.7, "elapsed_time": "0:24:46", "remaining_time": "0:17:25"}
{"current_steps": 410, "total_steps": 690, "loss": 0.7251, "lr": 1.9470382369776034e-05, "epoch": 1.1886792452830188, "percentage": 59.42, "elapsed_time": "0:24:59", "remaining_time": "0:17:03"}
{"current_steps": 415, "total_steps": 690, "loss": 0.6886, "lr": 1.8887337306049473e-05, "epoch": 1.2031930333817127, "percentage": 60.14, "elapsed_time": "0:25:16", "remaining_time": "0:16:44"}
{"current_steps": 420, "total_steps": 690, "loss": 0.6796, "lr": 1.830780757775185e-05, "epoch": 1.2177068214804063, "percentage": 60.87, "elapsed_time": "0:25:38", "remaining_time": "0:16:29"}
{"current_steps": 425, "total_steps": 690, "loss": 0.6463, "lr": 1.773212646703662e-05, "epoch": 1.2322206095791002, "percentage": 61.59, "elapsed_time": "0:25:58", "remaining_time": "0:16:12"}
{"current_steps": 430, "total_steps": 690, "loss": 0.7149, "lr": 1.7160625042753088e-05, "epoch": 1.2467343976777938, "percentage": 62.32, "elapsed_time": "0:26:13", "remaining_time": "0:15:51"}
{"current_steps": 435, "total_steps": 690, "loss": 0.7487, "lr": 1.6593631970051792e-05, "epoch": 1.2612481857764877, "percentage": 63.04, "elapsed_time": "0:26:27", "remaining_time": "0:15:30"}
{"current_steps": 440, "total_steps": 690, "loss": 0.7117, "lr": 1.6031473321372215e-05, "epoch": 1.2757619738751815, "percentage": 63.77, "elapsed_time": "0:26:42", "remaining_time": "0:15:10"}
{"current_steps": 445, "total_steps": 690, "loss": 0.6477, "lr": 1.547447238892159e-05, "epoch": 1.2902757619738752, "percentage": 64.49, "elapsed_time": "0:27:01", "remaining_time": "0:14:52"}
{"current_steps": 450, "total_steps": 690, "loss": 0.6712, "lr": 1.492294949875255e-05, "epoch": 1.3047895500725688, "percentage": 65.22, "elapsed_time": "0:27:19", "remaining_time": "0:14:34"}
{"current_steps": 455, "total_steps": 690, "loss": 0.7064, "lr": 1.437722182654659e-05, "epoch": 1.3193033381712627, "percentage": 65.94, "elapsed_time": "0:27:37", "remaining_time": "0:14:16"}
{"current_steps": 460, "total_steps": 690, "loss": 0.732, "lr": 1.3837603215209272e-05, "epoch": 1.3338171262699565, "percentage": 66.67, "elapsed_time": "0:27:51", "remaining_time": "0:13:55"}
{"current_steps": 465, "total_steps": 690, "loss": 0.7432, "lr": 1.3304403994382125e-05, "epoch": 1.3483309143686502, "percentage": 67.39, "elapsed_time": "0:28:06", "remaining_time": "0:13:35"}
{"current_steps": 470, "total_steps": 690, "loss": 0.7288, "lr": 1.2777930801974917e-05, "epoch": 1.362844702467344, "percentage": 68.12, "elapsed_time": "0:28:22", "remaining_time": "0:13:16"}
{"current_steps": 475, "total_steps": 690, "loss": 0.6967, "lr": 1.2258486407821082e-05, "epoch": 1.3773584905660377, "percentage": 68.84, "elapsed_time": "0:28:36", "remaining_time": "0:12:57"}
{"current_steps": 480, "total_steps": 690, "loss": 0.7243, "lr": 1.1746369539557606e-05, "epoch": 1.3918722786647315, "percentage": 69.57, "elapsed_time": "0:28:51", "remaining_time": "0:12:37"}
{"current_steps": 485, "total_steps": 690, "loss": 0.7066, "lr": 1.124187471082947e-05, "epoch": 1.4063860667634254, "percentage": 70.29, "elapsed_time": "0:29:09", "remaining_time": "0:12:19"}
{"current_steps": 490, "total_steps": 690, "loss": 0.6855, "lr": 1.0745292051917716e-05, "epoch": 1.420899854862119, "percentage": 71.01, "elapsed_time": "0:29:32", "remaining_time": "0:12:03"}
{"current_steps": 495, "total_steps": 690, "loss": 0.7094, "lr": 1.0256907142888111e-05, "epoch": 1.4354136429608126, "percentage": 71.74, "elapsed_time": "0:29:46", "remaining_time": "0:11:43"}
{"current_steps": 500, "total_steps": 690, "loss": 0.663, "lr": 9.777000849356785e-06, "epoch": 1.4499274310595065, "percentage": 72.46, "elapsed_time": "0:30:02", "remaining_time": "0:11:25"}
{"current_steps": 500, "total_steps": 690, "eval_loss": 0.7801858186721802, "epoch": 1.4499274310595065, "percentage": 72.46, "elapsed_time": "0:30:22", "remaining_time": "0:11:32"}
{"current_steps": 505, "total_steps": 690, "loss": 0.7131, "lr": 9.305849160966994e-06, "epoch": 1.4644412191582004, "percentage": 73.19, "elapsed_time": "0:30:44", "remaining_time": "0:11:15"}
{"current_steps": 510, "total_steps": 690, "loss": 0.6971, "lr": 8.843723032670036e-06, "epoch": 1.478955007256894, "percentage": 73.91, "elapsed_time": "0:30:58", "remaining_time": "0:10:55"}
{"current_steps": 515, "total_steps": 690, "loss": 0.6897, "lr": 8.390888228901615e-06, "epoch": 1.4934687953555879, "percentage": 74.64, "elapsed_time": "0:31:15", "remaining_time": "0:10:37"}
{"current_steps": 520, "total_steps": 690, "loss": 0.751, "lr": 7.947605170743138e-06, "epoch": 1.5079825834542815, "percentage": 75.36, "elapsed_time": "0:31:26", "remaining_time": "0:10:16"}
{"current_steps": 525, "total_steps": 690, "loss": 0.676, "lr": 7.514128786156052e-06, "epoch": 1.5224963715529753, "percentage": 76.09, "elapsed_time": "0:31:44", "remaining_time": "0:09:58"}
{"current_steps": 530, "total_steps": 690, "loss": 0.6759, "lr": 7.090708363375026e-06, "epoch": 1.5370101596516692, "percentage": 76.81, "elapsed_time": "0:32:01", "remaining_time": "0:09:40"}
{"current_steps": 535, "total_steps": 690, "loss": 0.6602, "lr": 6.677587407544739e-06, "epoch": 1.5515239477503628, "percentage": 77.54, "elapsed_time": "0:32:24", "remaining_time": "0:09:23"}
{"current_steps": 540, "total_steps": 690, "loss": 0.6924, "lr": 6.275003500682258e-06, "epoch": 1.5660377358490565, "percentage": 78.26, "elapsed_time": "0:32:39", "remaining_time": "0:09:04"}
{"current_steps": 545, "total_steps": 690, "loss": 0.6922, "lr": 5.8831881650458414e-06, "epoch": 1.5805515239477503, "percentage": 78.99, "elapsed_time": "0:32:56", "remaining_time": "0:08:45"}
{"current_steps": 550, "total_steps": 690, "loss": 0.6655, "lr": 5.502366729988662e-06, "epoch": 1.5950653120464442, "percentage": 79.71, "elapsed_time": "0:33:13", "remaining_time": "0:08:27"}
{"current_steps": 555, "total_steps": 690, "loss": 0.6586, "lr": 5.132758202373972e-06, "epoch": 1.6095791001451378, "percentage": 80.43, "elapsed_time": "0:33:31", "remaining_time": "0:08:09"}
{"current_steps": 560, "total_steps": 690, "loss": 0.6834, "lr": 4.7745751406263165e-06, "epoch": 1.6240928882438317, "percentage": 81.16, "elapsed_time": "0:33:45", "remaining_time": "0:07:50"}
{"current_steps": 565, "total_steps": 690, "loss": 0.6767, "lr": 4.428023532491138e-06, "epoch": 1.6386066763425253, "percentage": 81.88, "elapsed_time": "0:34:05", "remaining_time": "0:07:32"}
{"current_steps": 570, "total_steps": 690, "loss": 0.6365, "lr": 4.093302676573154e-06, "epoch": 1.6531204644412192, "percentage": 82.61, "elapsed_time": "0:34:26", "remaining_time": "0:07:15"}
{"current_steps": 575, "total_steps": 690, "loss": 0.717, "lr": 3.7706050677215944e-06, "epoch": 1.667634252539913, "percentage": 83.33, "elapsed_time": "0:34:41", "remaining_time": "0:06:56"}
{"current_steps": 580, "total_steps": 690, "loss": 0.68, "lr": 3.4601162863281746e-06, "epoch": 1.6821480406386067, "percentage": 84.06, "elapsed_time": "0:35:00", "remaining_time": "0:06:38"}
{"current_steps": 585, "total_steps": 690, "loss": 0.7526, "lr": 3.162014891601575e-06, "epoch": 1.6966618287373003, "percentage": 84.78, "elapsed_time": "0:35:11", "remaining_time": "0:06:19"}
{"current_steps": 590, "total_steps": 690, "loss": 0.648, "lr": 2.876472318879675e-06, "epoch": 1.7111756168359942, "percentage": 85.51, "elapsed_time": "0:35:28", "remaining_time": "0:06:00"}
{"current_steps": 595, "total_steps": 690, "loss": 0.697, "lr": 2.6036527810387012e-06, "epoch": 1.725689404934688, "percentage": 86.23, "elapsed_time": "0:35:42", "remaining_time": "0:05:42"}
{"current_steps": 600, "total_steps": 690, "loss": 0.7083, "lr": 2.343713174055917e-06, "epoch": 1.7402031930333817, "percentage": 86.96, "elapsed_time": "0:35:56", "remaining_time": "0:05:23"}
{"current_steps": 600, "total_steps": 690, "eval_loss": 0.7767183780670166, "epoch": 1.7402031930333817, "percentage": 86.96, "elapsed_time": "0:36:15", "remaining_time": "0:05:26"}
{"current_steps": 605, "total_steps": 690, "loss": 0.6615, "lr": 2.0968029867802245e-06, "epoch": 1.7547169811320755, "percentage": 87.68, "elapsed_time": "0:36:34", "remaining_time": "0:05:08"}
{"current_steps": 610, "total_steps": 690, "loss": 0.6918, "lr": 1.8630642149624984e-06, "epoch": 1.7692307692307692, "percentage": 88.41, "elapsed_time": "0:36:50", "remaining_time": "0:04:49"}
{"current_steps": 615, "total_steps": 690, "loss": 0.7056, "lr": 1.642631279595161e-06, "epoch": 1.783744557329463, "percentage": 89.13, "elapsed_time": "0:37:09", "remaining_time": "0:04:31"}
{"current_steps": 620, "total_steps": 690, "loss": 0.6898, "lr": 1.435630949607933e-06, "epoch": 1.7982583454281569, "percentage": 89.86, "elapsed_time": "0:37:26", "remaining_time": "0:04:13"}
{"current_steps": 625, "total_steps": 690, "loss": 0.6623, "lr": 1.2421822689641704e-06, "epoch": 1.8127721335268505, "percentage": 90.58, "elapsed_time": "0:37:45", "remaining_time": "0:03:55"}
{"current_steps": 630, "total_steps": 690, "loss": 0.7124, "lr": 1.0623964881998267e-06, "epoch": 1.8272859216255442, "percentage": 91.3, "elapsed_time": "0:37:59", "remaining_time": "0:03:37"}
{"current_steps": 635, "total_steps": 690, "loss": 0.6846, "lr": 8.963770004442707e-07, "epoch": 1.841799709724238, "percentage": 92.03, "elapsed_time": "0:38:15", "remaining_time": "0:03:18"}
{"current_steps": 640, "total_steps": 690, "loss": 0.6931, "lr": 7.44219281959882e-07, "epoch": 1.8563134978229319, "percentage": 92.75, "elapsed_time": "0:38:31", "remaining_time": "0:03:00"}
{"current_steps": 645, "total_steps": 690, "loss": 0.6756, "lr": 6.060108372345358e-07, "epoch": 1.8708272859216255, "percentage": 93.48, "elapsed_time": "0:38:51", "remaining_time": "0:02:42"}
{"current_steps": 650, "total_steps": 690, "loss": 0.6955, "lr": 4.818311486585791e-07, "epoch": 1.8853410740203191, "percentage": 94.2, "elapsed_time": "0:39:07", "remaining_time": "0:02:24"}
{"current_steps": 655, "total_steps": 690, "loss": 0.6549, "lr": 3.7175163081526187e-07, "epoch": 1.899854862119013, "percentage": 94.93, "elapsed_time": "0:39:25", "remaining_time": "0:02:06"}
{"current_steps": 660, "total_steps": 690, "loss": 0.6645, "lr": 2.758355894108555e-07, "epoch": 1.9143686502177069, "percentage": 95.65, "elapsed_time": "0:39:45", "remaining_time": "0:01:48"}
{"current_steps": 665, "total_steps": 690, "loss": 0.675, "lr": 1.941381848681506e-07, "epoch": 1.9288824383164007, "percentage": 96.38, "elapsed_time": "0:40:03", "remaining_time": "0:01:30"}
{"current_steps": 670, "total_steps": 690, "loss": 0.6556, "lr": 1.267064006041957e-07, "epoch": 1.9433962264150944, "percentage": 97.1, "elapsed_time": "0:40:23", "remaining_time": "0:01:12"}
{"current_steps": 675, "total_steps": 690, "loss": 0.7047, "lr": 7.357901601058037e-08, "epoch": 1.957910014513788, "percentage": 97.83, "elapsed_time": "0:40:38", "remaining_time": "0:00:54"}
{"current_steps": 680, "total_steps": 690, "loss": 0.669, "lr": 3.4786584151766386e-08, "epoch": 1.9724238026124818, "percentage": 98.55, "elapsed_time": "0:40:55", "remaining_time": "0:00:36"}
{"current_steps": 685, "total_steps": 690, "loss": 0.6589, "lr": 1.0351414194298414e-08, "epoch": 1.9869375907111757, "percentage": 99.28, "elapsed_time": "0:41:14", "remaining_time": "0:00:18"}
{"current_steps": 690, "total_steps": 690, "loss": 0.7122, "lr": 2.8755857701956436e-10, "epoch": 2.0, "percentage": 100.0, "elapsed_time": "0:41:28", "remaining_time": "0:00:00"}
{"current_steps": 690, "total_steps": 690, "epoch": 2.0, "percentage": 100.0, "elapsed_time": "0:41:28", "remaining_time": "0:00:00"}