sedrickkeh commited on
Commit
9f65e93
·
verified ·
1 Parent(s): afe1507

Training in progress, epoch 1

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c9211742ef2638a8ed57e216126e68d6f6ab430555ce157670307a9d027318b1
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19f365182092c5b509153d266b8509068c8c7c5f1fb6e646a2f87c817164957c
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:be5980625b0e88ac9690371e682be2d3ebaa7ecc1a272d1e76c50a082cce5f68
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7836b53c6636fbbcfa0706d7c3463107bcd4c85421a4995917f8018e908e161
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e53bf41a8b197646abb29b6c1172ac892f4499d622a9c86a7c14f10eeae1143f
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9508cf80fc9e50305e1816c5f37be7b881e76e87c2b41c9db06ae702ee7df269
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:da30cc723754323cd833dc6ee7d54aac6077268ceb077ac5155c2f7c552e802c
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94b67726d38830aac48e67a71bb14f1f2ea89b4caf7c0133a2c98e2535cf6177
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -109,3 +109,114 @@
109
  {"current_steps": 109, "total_steps": 333, "loss": 0.4834, "lr": 0.00019292652433359177, "epoch": 0.9792251544076361, "percentage": 32.73, "elapsed_time": "10:29:47", "remaining_time": "21:34:14"}
110
  {"current_steps": 110, "total_steps": 333, "loss": 0.4946, "lr": 0.00019207937130510442, "epoch": 0.9882088714205502, "percentage": 33.03, "elapsed_time": "10:35:24", "remaining_time": "21:28:09"}
111
  {"current_steps": 111, "total_steps": 333, "loss": 0.4846, "lr": 0.0001912235033538814, "epoch": 0.9971925884334644, "percentage": 33.33, "elapsed_time": "10:41:11", "remaining_time": "21:22:22"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
109
  {"current_steps": 109, "total_steps": 333, "loss": 0.4834, "lr": 0.00019292652433359177, "epoch": 0.9792251544076361, "percentage": 32.73, "elapsed_time": "10:29:47", "remaining_time": "21:34:14"}
110
  {"current_steps": 110, "total_steps": 333, "loss": 0.4946, "lr": 0.00019207937130510442, "epoch": 0.9882088714205502, "percentage": 33.03, "elapsed_time": "10:35:24", "remaining_time": "21:28:09"}
111
  {"current_steps": 111, "total_steps": 333, "loss": 0.4846, "lr": 0.0001912235033538814, "epoch": 0.9971925884334644, "percentage": 33.33, "elapsed_time": "10:41:11", "remaining_time": "21:22:22"}
112
+ {"current_steps": 112, "total_steps": 333, "loss": 0.8602, "lr": 0.00019035901496432887, "epoch": 1.0075800112296462, "percentage": 33.63, "elapsed_time": "10:47:47", "remaining_time": "21:18:13"}
113
+ {"current_steps": 113, "total_steps": 333, "loss": 0.4935, "lr": 0.0001894860015725148, "epoch": 1.0165637282425604, "percentage": 33.93, "elapsed_time": "10:53:31", "remaining_time": "21:12:21"}
114
+ {"current_steps": 114, "total_steps": 333, "loss": 0.4655, "lr": 0.0001886045595556335, "epoch": 1.0255474452554745, "percentage": 34.23, "elapsed_time": "10:59:07", "remaining_time": "21:06:13"}
115
+ {"current_steps": 115, "total_steps": 333, "loss": 0.4778, "lr": 0.00018771478622136586, "epoch": 1.0345311622683886, "percentage": 34.53, "elapsed_time": "11:04:47", "remaining_time": "21:00:13"}
116
+ {"current_steps": 116, "total_steps": 333, "loss": 0.4786, "lr": 0.0001868167797971369, "epoch": 1.0435148792813027, "percentage": 34.83, "elapsed_time": "11:10:34", "remaining_time": "20:54:25"}
117
+ {"current_steps": 117, "total_steps": 333, "loss": 0.4667, "lr": 0.00018591063941927197, "epoch": 1.0524985962942168, "percentage": 35.14, "elapsed_time": "11:16:13", "remaining_time": "20:48:24"}
118
+ {"current_steps": 118, "total_steps": 333, "loss": 0.4698, "lr": 0.00018499646512205238, "epoch": 1.0614823133071307, "percentage": 35.44, "elapsed_time": "11:22:05", "remaining_time": "20:42:47"}
119
+ {"current_steps": 119, "total_steps": 333, "loss": 0.4573, "lr": 0.00018407435782667207, "epoch": 1.0704660303200448, "percentage": 35.74, "elapsed_time": "11:27:37", "remaining_time": "20:36:34"}
120
+ {"current_steps": 120, "total_steps": 333, "loss": 0.4537, "lr": 0.0001831444193300964, "epoch": 1.079449747332959, "percentage": 36.04, "elapsed_time": "11:33:00", "remaining_time": "20:30:06"}
121
+ {"current_steps": 121, "total_steps": 333, "loss": 0.4607, "lr": 0.00018220675229382407, "epoch": 1.088433464345873, "percentage": 36.34, "elapsed_time": "11:38:49", "remaining_time": "20:24:23"}
122
+ {"current_steps": 122, "total_steps": 333, "loss": 0.4491, "lr": 0.0001812614602325536, "epoch": 1.0974171813587872, "percentage": 36.64, "elapsed_time": "11:44:45", "remaining_time": "20:18:52"}
123
+ {"current_steps": 123, "total_steps": 333, "loss": 0.4649, "lr": 0.00018030864750275598, "epoch": 1.1064008983717013, "percentage": 36.94, "elapsed_time": "11:50:25", "remaining_time": "20:12:55"}
124
+ {"current_steps": 124, "total_steps": 333, "loss": 0.4405, "lr": 0.0001793484192911539, "epoch": 1.1153846153846154, "percentage": 37.24, "elapsed_time": "11:56:11", "remaining_time": "20:07:07"}
125
+ {"current_steps": 125, "total_steps": 333, "loss": 0.4673, "lr": 0.00017838088160310975, "epoch": 1.1243683323975295, "percentage": 37.54, "elapsed_time": "12:01:47", "remaining_time": "20:01:03"}
126
+ {"current_steps": 126, "total_steps": 333, "loss": 0.4366, "lr": 0.00017740614125092276, "epoch": 1.1333520494104437, "percentage": 37.84, "elapsed_time": "12:07:23", "remaining_time": "19:55:00"}
127
+ {"current_steps": 127, "total_steps": 333, "loss": 0.4506, "lr": 0.00017642430584203776, "epoch": 1.1423357664233578, "percentage": 38.14, "elapsed_time": "12:13:05", "remaining_time": "19:49:07"}
128
+ {"current_steps": 128, "total_steps": 333, "loss": 0.4409, "lr": 0.0001754354837671654, "epoch": 1.1513194834362717, "percentage": 38.44, "elapsed_time": "12:18:55", "remaining_time": "19:43:25"}
129
+ {"current_steps": 129, "total_steps": 333, "loss": 0.455, "lr": 0.0001744397841883164, "epoch": 1.1603032004491858, "percentage": 38.74, "elapsed_time": "12:24:39", "remaining_time": "19:37:36"}
130
+ {"current_steps": 130, "total_steps": 333, "loss": 0.4453, "lr": 0.00017343731702675036, "epoch": 1.1692869174621, "percentage": 39.04, "elapsed_time": "12:30:25", "remaining_time": "19:31:49"}
131
+ {"current_steps": 131, "total_steps": 333, "loss": 0.4447, "lr": 0.00017242819295084123, "epoch": 1.178270634475014, "percentage": 39.34, "elapsed_time": "12:36:17", "remaining_time": "19:26:10"}
132
+ {"current_steps": 132, "total_steps": 333, "loss": 0.444, "lr": 0.0001714125233638595, "epoch": 1.1872543514879281, "percentage": 39.64, "elapsed_time": "12:42:07", "remaining_time": "19:20:30"}
133
+ {"current_steps": 133, "total_steps": 333, "loss": 0.4434, "lr": 0.00017039042039167416, "epoch": 1.1962380685008422, "percentage": 39.94, "elapsed_time": "12:47:58", "remaining_time": "19:14:50"}
134
+ {"current_steps": 134, "total_steps": 333, "loss": 0.4392, "lr": 0.00016936199687037412, "epoch": 1.2052217855137564, "percentage": 40.24, "elapsed_time": "12:53:38", "remaining_time": "19:08:54"}
135
+ {"current_steps": 135, "total_steps": 333, "loss": 0.44, "lr": 0.00016832736633381174, "epoch": 1.2142055025266705, "percentage": 40.54, "elapsed_time": "12:59:13", "remaining_time": "19:02:51"}
136
+ {"current_steps": 136, "total_steps": 333, "loss": 0.4395, "lr": 0.00016728664300106905, "epoch": 1.2231892195395846, "percentage": 40.84, "elapsed_time": "13:04:47", "remaining_time": "18:56:47"}
137
+ {"current_steps": 137, "total_steps": 333, "loss": 0.442, "lr": 0.0001662399417638485, "epoch": 1.2321729365524985, "percentage": 41.14, "elapsed_time": "13:10:14", "remaining_time": "18:50:34"}
138
+ {"current_steps": 138, "total_steps": 333, "loss": 0.4379, "lr": 0.00016518737817378936, "epoch": 1.2411566535654126, "percentage": 41.44, "elapsed_time": "13:15:52", "remaining_time": "18:44:36"}
139
+ {"current_steps": 139, "total_steps": 333, "loss": 0.4371, "lr": 0.0001641290684297112, "epoch": 1.2501403705783267, "percentage": 41.74, "elapsed_time": "13:21:45", "remaining_time": "18:39:00"}
140
+ {"current_steps": 140, "total_steps": 333, "loss": 0.4353, "lr": 0.00016306512936478605, "epoch": 1.2591240875912408, "percentage": 42.04, "elapsed_time": "13:27:20", "remaining_time": "18:32:58"}
141
+ {"current_steps": 141, "total_steps": 333, "loss": 0.4379, "lr": 0.00016199567843364066, "epoch": 1.268107804604155, "percentage": 42.34, "elapsed_time": "13:33:02", "remaining_time": "18:27:06"}
142
+ {"current_steps": 142, "total_steps": 333, "loss": 0.4364, "lr": 0.00016092083369938952, "epoch": 1.277091521617069, "percentage": 42.64, "elapsed_time": "13:39:08", "remaining_time": "18:21:48"}
143
+ {"current_steps": 143, "total_steps": 333, "loss": 0.4385, "lr": 0.00015984071382060174, "epoch": 1.2860752386299832, "percentage": 42.94, "elapsed_time": "13:44:35", "remaining_time": "18:15:36"}
144
+ {"current_steps": 144, "total_steps": 333, "loss": 0.4425, "lr": 0.00015875543803820115, "epoch": 1.2950589556428973, "percentage": 43.24, "elapsed_time": "13:50:24", "remaining_time": "18:09:54"}
145
+ {"current_steps": 145, "total_steps": 333, "loss": 0.4251, "lr": 0.00015766512616230286, "epoch": 1.3040426726558114, "percentage": 43.54, "elapsed_time": "13:56:10", "remaining_time": "18:04:09"}
146
+ {"current_steps": 146, "total_steps": 333, "loss": 0.4374, "lr": 0.00015656989855898653, "epoch": 1.3130263896687255, "percentage": 43.84, "elapsed_time": "14:02:10", "remaining_time": "17:58:40"}
147
+ {"current_steps": 147, "total_steps": 333, "loss": 0.4385, "lr": 0.00015546987613700858, "epoch": 1.3220101066816397, "percentage": 44.14, "elapsed_time": "14:07:53", "remaining_time": "17:52:50"}
148
+ {"current_steps": 148, "total_steps": 333, "loss": 0.4414, "lr": 0.00015436518033445427, "epoch": 1.3309938236945535, "percentage": 44.44, "elapsed_time": "14:13:52", "remaining_time": "17:47:20"}
149
+ {"current_steps": 149, "total_steps": 333, "loss": 0.4292, "lr": 0.00015325593310533135, "epoch": 1.3399775407074677, "percentage": 44.74, "elapsed_time": "14:19:59", "remaining_time": "17:42:00"}
150
+ {"current_steps": 150, "total_steps": 333, "loss": 0.4367, "lr": 0.00015214225690610695, "epoch": 1.3489612577203818, "percentage": 45.05, "elapsed_time": "14:25:55", "remaining_time": "17:36:25"}
151
+ {"current_steps": 151, "total_steps": 333, "loss": 0.4343, "lr": 0.00015102427468218884, "epoch": 1.357944974733296, "percentage": 45.35, "elapsed_time": "14:31:36", "remaining_time": "17:30:32"}
152
+ {"current_steps": 152, "total_steps": 333, "loss": 0.4225, "lr": 0.00014990210985435274, "epoch": 1.36692869174621, "percentage": 45.65, "elapsed_time": "14:37:14", "remaining_time": "17:24:36"}
153
+ {"current_steps": 153, "total_steps": 333, "loss": 0.4291, "lr": 0.00014877588630511702, "epoch": 1.3759124087591241, "percentage": 45.95, "elapsed_time": "14:42:55", "remaining_time": "17:18:44"}
154
+ {"current_steps": 154, "total_steps": 333, "loss": 0.4314, "lr": 0.0001476457283650669, "epoch": 1.3848961257720382, "percentage": 46.25, "elapsed_time": "14:48:36", "remaining_time": "17:12:52"}
155
+ {"current_steps": 155, "total_steps": 333, "loss": 0.4248, "lr": 0.00014651176079912844, "epoch": 1.3938798427849521, "percentage": 46.55, "elapsed_time": "14:54:19", "remaining_time": "17:07:01"}
156
+ {"current_steps": 156, "total_steps": 333, "loss": 0.4233, "lr": 0.00014537410879279536, "epoch": 1.4028635597978663, "percentage": 46.85, "elapsed_time": "15:00:01", "remaining_time": "17:01:10"}
157
+ {"current_steps": 157, "total_steps": 333, "loss": 0.4362, "lr": 0.00014423289793830883, "epoch": 1.4118472768107804, "percentage": 47.15, "elapsed_time": "15:05:55", "remaining_time": "16:55:33"}
158
+ {"current_steps": 158, "total_steps": 333, "loss": 0.4252, "lr": 0.00014308825422079265, "epoch": 1.4208309938236945, "percentage": 47.45, "elapsed_time": "15:11:47", "remaining_time": "16:49:53"}
159
+ {"current_steps": 159, "total_steps": 333, "loss": 0.4395, "lr": 0.00014194030400434496, "epoch": 1.4298147108366086, "percentage": 47.75, "elapsed_time": "15:17:31", "remaining_time": "16:44:05"}
160
+ {"current_steps": 160, "total_steps": 333, "loss": 0.4355, "lr": 0.00014078917401808824, "epoch": 1.4387984278495227, "percentage": 48.05, "elapsed_time": "15:23:18", "remaining_time": "16:38:19"}
161
+ {"current_steps": 161, "total_steps": 333, "loss": 0.4355, "lr": 0.0001396349913421788, "epoch": 1.4477821448624368, "percentage": 48.35, "elapsed_time": "15:29:07", "remaining_time": "16:32:36"}
162
+ {"current_steps": 162, "total_steps": 333, "loss": 0.4411, "lr": 0.00013847788339377788, "epoch": 1.456765861875351, "percentage": 48.65, "elapsed_time": "15:34:47", "remaining_time": "16:26:43"}
163
+ {"current_steps": 163, "total_steps": 333, "loss": 0.434, "lr": 0.0001373179779129849, "epoch": 1.465749578888265, "percentage": 48.95, "elapsed_time": "15:40:44", "remaining_time": "16:21:08"}
164
+ {"current_steps": 164, "total_steps": 333, "loss": 0.4296, "lr": 0.00013615540294873585, "epoch": 1.4747332959011792, "percentage": 49.25, "elapsed_time": "15:46:30", "remaining_time": "16:15:21"}
165
+ {"current_steps": 165, "total_steps": 333, "loss": 0.4316, "lr": 0.00013499028684466692, "epoch": 1.4837170129140933, "percentage": 49.55, "elapsed_time": "15:52:11", "remaining_time": "16:09:30"}
166
+ {"current_steps": 166, "total_steps": 333, "loss": 0.4268, "lr": 0.00013382275822494612, "epoch": 1.4927007299270074, "percentage": 49.85, "elapsed_time": "15:57:47", "remaining_time": "16:03:33"}
167
+ {"current_steps": 167, "total_steps": 333, "loss": 0.4338, "lr": 0.00013265294598007347, "epoch": 1.5016844469399215, "percentage": 50.15, "elapsed_time": "16:03:26", "remaining_time": "15:57:40"}
168
+ {"current_steps": 168, "total_steps": 333, "loss": 0.4335, "lr": 0.00013148097925265212, "epoch": 1.5106681639528357, "percentage": 50.45, "elapsed_time": "16:09:03", "remaining_time": "15:51:44"}
169
+ {"current_steps": 169, "total_steps": 333, "loss": 0.4206, "lr": 0.00013030698742313152, "epoch": 1.5196518809657495, "percentage": 50.75, "elapsed_time": "16:14:50", "remaining_time": "15:45:59"}
170
+ {"current_steps": 170, "total_steps": 333, "loss": 0.4322, "lr": 0.00012913110009552428, "epoch": 1.5286355979786637, "percentage": 51.05, "elapsed_time": "16:20:50", "remaining_time": "15:40:27"}
171
+ {"current_steps": 171, "total_steps": 333, "loss": 0.4282, "lr": 0.0001279534470830984, "epoch": 1.5376193149915778, "percentage": 51.35, "elapsed_time": "16:26:29", "remaining_time": "15:34:34"}
172
+ {"current_steps": 172, "total_steps": 333, "loss": 0.4315, "lr": 0.00012677415839404646, "epoch": 1.546603032004492, "percentage": 51.65, "elapsed_time": "16:32:18", "remaining_time": "15:28:50"}
173
+ {"current_steps": 173, "total_steps": 333, "loss": 0.4255, "lr": 0.00012559336421713333, "epoch": 1.5555867490174058, "percentage": 51.95, "elapsed_time": "16:38:08", "remaining_time": "15:23:08"}
174
+ {"current_steps": 174, "total_steps": 333, "loss": 0.4197, "lr": 0.00012441119490732357, "epoch": 1.56457046603032, "percentage": 52.25, "elapsed_time": "16:44:01", "remaining_time": "15:17:28"}
175
+ {"current_steps": 175, "total_steps": 333, "loss": 0.4333, "lr": 0.00012322778097139102, "epoch": 1.573554183043234, "percentage": 52.55, "elapsed_time": "16:49:41", "remaining_time": "15:11:36"}
176
+ {"current_steps": 176, "total_steps": 333, "loss": 0.4327, "lr": 0.00012204325305351117, "epoch": 1.5825379000561481, "percentage": 52.85, "elapsed_time": "16:55:37", "remaining_time": "15:05:58"}
177
+ {"current_steps": 177, "total_steps": 333, "loss": 0.424, "lr": 0.00012085774192083878, "epoch": 1.5915216170690623, "percentage": 53.15, "elapsed_time": "17:01:25", "remaining_time": "15:00:14"}
178
+ {"current_steps": 178, "total_steps": 333, "loss": 0.4198, "lr": 0.00011967137844907157, "epoch": 1.6005053340819764, "percentage": 53.45, "elapsed_time": "17:07:12", "remaining_time": "14:54:28"}
179
+ {"current_steps": 179, "total_steps": 333, "loss": 0.4279, "lr": 0.00011848429360800205, "epoch": 1.6094890510948905, "percentage": 53.75, "elapsed_time": "17:12:54", "remaining_time": "14:48:38"}
180
+ {"current_steps": 180, "total_steps": 333, "loss": 0.4249, "lr": 0.00011729661844705912, "epoch": 1.6184727681078046, "percentage": 54.05, "elapsed_time": "17:18:17", "remaining_time": "14:42:32"}
181
+ {"current_steps": 181, "total_steps": 333, "loss": 0.4275, "lr": 0.00011610848408084054, "epoch": 1.6274564851207187, "percentage": 54.35, "elapsed_time": "17:24:03", "remaining_time": "14:36:46"}
182
+ {"current_steps": 182, "total_steps": 333, "loss": 0.4225, "lr": 0.0001149200216746385, "epoch": 1.6364402021336328, "percentage": 54.65, "elapsed_time": "17:29:30", "remaining_time": "14:30:45"}
183
+ {"current_steps": 183, "total_steps": 333, "loss": 0.4153, "lr": 0.00011373136242995958, "epoch": 1.645423919146547, "percentage": 54.95, "elapsed_time": "17:35:17", "remaining_time": "14:24:59"}
184
+ {"current_steps": 184, "total_steps": 333, "loss": 0.4164, "lr": 0.00011254263757004044, "epoch": 1.654407636159461, "percentage": 55.26, "elapsed_time": "17:41:01", "remaining_time": "14:19:12"}
185
+ {"current_steps": 185, "total_steps": 333, "loss": 0.4253, "lr": 0.00011135397832536151, "epoch": 1.6633913531723752, "percentage": 55.56, "elapsed_time": "17:46:50", "remaining_time": "14:13:28"}
186
+ {"current_steps": 186, "total_steps": 333, "loss": 0.4239, "lr": 0.00011016551591915949, "epoch": 1.6723750701852893, "percentage": 55.86, "elapsed_time": "17:52:35", "remaining_time": "14:07:41"}
187
+ {"current_steps": 187, "total_steps": 333, "loss": 0.4245, "lr": 0.0001089773815529409, "epoch": 1.6813587871982034, "percentage": 56.16, "elapsed_time": "17:58:25", "remaining_time": "14:01:58"}
188
+ {"current_steps": 188, "total_steps": 333, "loss": 0.4198, "lr": 0.00010778970639199795, "epoch": 1.6903425042111173, "percentage": 56.46, "elapsed_time": "18:04:38", "remaining_time": "13:56:33"}
189
+ {"current_steps": 189, "total_steps": 333, "loss": 0.4275, "lr": 0.00010660262155092845, "epoch": 1.6993262212240314, "percentage": 56.76, "elapsed_time": "18:10:16", "remaining_time": "13:50:41"}
190
+ {"current_steps": 190, "total_steps": 333, "loss": 0.4175, "lr": 0.00010541625807916123, "epoch": 1.7083099382369455, "percentage": 57.06, "elapsed_time": "18:15:59", "remaining_time": "13:44:52"}
191
+ {"current_steps": 191, "total_steps": 333, "loss": 0.4272, "lr": 0.00010423074694648884, "epoch": 1.7172936552498597, "percentage": 57.36, "elapsed_time": "18:22:00", "remaining_time": "13:39:17"}
192
+ {"current_steps": 192, "total_steps": 333, "loss": 0.4274, "lr": 0.00010304621902860899, "epoch": 1.7262773722627736, "percentage": 57.66, "elapsed_time": "18:27:56", "remaining_time": "13:33:38"}
193
+ {"current_steps": 193, "total_steps": 333, "loss": 0.4275, "lr": 0.00010186280509267643, "epoch": 1.7352610892756877, "percentage": 57.96, "elapsed_time": "18:33:59", "remaining_time": "13:28:04"}
194
+ {"current_steps": 194, "total_steps": 333, "loss": 0.4172, "lr": 0.00010068063578286667, "epoch": 1.7442448062886018, "percentage": 58.26, "elapsed_time": "18:39:53", "remaining_time": "13:22:23"}
195
+ {"current_steps": 195, "total_steps": 333, "loss": 0.4279, "lr": 9.949984160595352e-05, "epoch": 1.753228523301516, "percentage": 58.56, "elapsed_time": "18:45:43", "remaining_time": "13:16:40"}
196
+ {"current_steps": 196, "total_steps": 333, "loss": 0.4315, "lr": 9.832055291690164e-05, "epoch": 1.76221224031443, "percentage": 58.86, "elapsed_time": "18:51:31", "remaining_time": "13:10:54"}
197
+ {"current_steps": 197, "total_steps": 333, "loss": 0.4182, "lr": 9.714289990447578e-05, "epoch": 1.7711959573273441, "percentage": 59.16, "elapsed_time": "18:57:12", "remaining_time": "13:05:04"}
198
+ {"current_steps": 198, "total_steps": 333, "loss": 0.4119, "lr": 9.596701257686851e-05, "epoch": 1.7801796743402583, "percentage": 59.46, "elapsed_time": "19:02:59", "remaining_time": "12:59:18"}
199
+ {"current_steps": 199, "total_steps": 333, "loss": 0.4162, "lr": 9.479302074734792e-05, "epoch": 1.7891633913531724, "percentage": 59.76, "elapsed_time": "19:08:56", "remaining_time": "12:53:39"}
200
+ {"current_steps": 200, "total_steps": 333, "loss": 0.4177, "lr": 9.362105401992656e-05, "epoch": 1.7981471083660865, "percentage": 60.06, "elapsed_time": "19:14:41", "remaining_time": "12:47:51"}
201
+ {"current_steps": 201, "total_steps": 333, "loss": 0.421, "lr": 9.245124177505392e-05, "epoch": 1.8071308253790006, "percentage": 60.36, "elapsed_time": "19:20:30", "remaining_time": "12:42:07"}
202
+ {"current_steps": 202, "total_steps": 333, "loss": 0.434, "lr": 9.12837131553331e-05, "epoch": 1.8161145423919147, "percentage": 60.66, "elapsed_time": "19:26:21", "remaining_time": "12:36:23"}
203
+ {"current_steps": 203, "total_steps": 333, "loss": 0.418, "lr": 9.011859705126419e-05, "epoch": 1.8250982594048288, "percentage": 60.96, "elapsed_time": "19:32:10", "remaining_time": "12:30:39"}
204
+ {"current_steps": 204, "total_steps": 333, "loss": 0.4113, "lr": 8.895602208701511e-05, "epoch": 1.834081976417743, "percentage": 61.26, "elapsed_time": "19:38:00", "remaining_time": "12:24:55"}
205
+ {"current_steps": 205, "total_steps": 333, "loss": 0.4239, "lr": 8.779611660622215e-05, "epoch": 1.843065693430657, "percentage": 61.56, "elapsed_time": "19:43:50", "remaining_time": "12:19:10"}
206
+ {"current_steps": 206, "total_steps": 333, "loss": 0.4121, "lr": 8.66390086578212e-05, "epoch": 1.8520494104435712, "percentage": 61.86, "elapsed_time": "19:49:29", "remaining_time": "12:13:19"}
207
+ {"current_steps": 207, "total_steps": 333, "loss": 0.4193, "lr": 8.548482598191181e-05, "epoch": 1.861033127456485, "percentage": 62.16, "elapsed_time": "19:55:22", "remaining_time": "12:07:37"}
208
+ {"current_steps": 208, "total_steps": 333, "loss": 0.4296, "lr": 8.433369599565508e-05, "epoch": 1.8700168444693992, "percentage": 62.46, "elapsed_time": "20:00:59", "remaining_time": "12:01:44"}
209
+ {"current_steps": 209, "total_steps": 333, "loss": 0.4164, "lr": 8.318574577920736e-05, "epoch": 1.8790005614823133, "percentage": 62.76, "elapsed_time": "20:06:43", "remaining_time": "11:55:57"}
210
+ {"current_steps": 210, "total_steps": 333, "loss": 0.4172, "lr": 8.204110206169114e-05, "epoch": 1.8879842784952274, "percentage": 63.06, "elapsed_time": "20:12:26", "remaining_time": "11:50:08"}
211
+ {"current_steps": 211, "total_steps": 333, "loss": 0.4167, "lr": 8.08998912072046e-05, "epoch": 1.8969679955081415, "percentage": 63.36, "elapsed_time": "20:18:11", "remaining_time": "11:44:21"}
212
+ {"current_steps": 212, "total_steps": 333, "loss": 0.4247, "lr": 7.976223920087153e-05, "epoch": 1.9059517125210554, "percentage": 63.66, "elapsed_time": "20:24:15", "remaining_time": "11:38:44"}
213
+ {"current_steps": 213, "total_steps": 333, "loss": 0.4076, "lr": 7.86282716349331e-05, "epoch": 1.9149354295339696, "percentage": 63.96, "elapsed_time": "20:30:07", "remaining_time": "11:33:01"}
214
+ {"current_steps": 214, "total_steps": 333, "loss": 0.425, "lr": 7.749811369488296e-05, "epoch": 1.9239191465468837, "percentage": 64.26, "elapsed_time": "20:35:54", "remaining_time": "11:27:15"}
215
+ {"current_steps": 215, "total_steps": 333, "loss": 0.4152, "lr": 7.637189014564727e-05, "epoch": 1.9329028635597978, "percentage": 64.56, "elapsed_time": "20:41:40", "remaining_time": "11:21:28"}
216
+ {"current_steps": 216, "total_steps": 333, "loss": 0.4201, "lr": 7.524972531781114e-05, "epoch": 1.941886580572712, "percentage": 64.86, "elapsed_time": "20:47:13", "remaining_time": "11:15:34"}
217
+ {"current_steps": 217, "total_steps": 333, "loss": 0.4084, "lr": 7.413174309389303e-05, "epoch": 1.950870297585626, "percentage": 65.17, "elapsed_time": "20:53:00", "remaining_time": "11:09:48"}
218
+ {"current_steps": 218, "total_steps": 333, "loss": 0.4275, "lr": 7.301806689466864e-05, "epoch": 1.9598540145985401, "percentage": 65.47, "elapsed_time": "20:58:47", "remaining_time": "11:04:02"}
219
+ {"current_steps": 219, "total_steps": 333, "loss": 0.418, "lr": 7.190881966554573e-05, "epoch": 1.9688377316114543, "percentage": 65.77, "elapsed_time": "21:04:24", "remaining_time": "10:58:11"}
220
+ {"current_steps": 220, "total_steps": 333, "loss": 0.4141, "lr": 7.080412386299138e-05, "epoch": 1.9778214486243684, "percentage": 66.07, "elapsed_time": "21:10:10", "remaining_time": "10:52:24"}
221
+ {"current_steps": 221, "total_steps": 333, "loss": 0.4029, "lr": 6.970410144101348e-05, "epoch": 1.9868051656372825, "percentage": 66.37, "elapsed_time": "21:15:40", "remaining_time": "10:46:29"}
222
+ {"current_steps": 222, "total_steps": 333, "loss": 0.4266, "lr": 6.860887383769717e-05, "epoch": 1.9957888826501966, "percentage": 66.67, "elapsed_time": "21:21:40", "remaining_time": "10:40:50"}