sedrickkeh commited on
Commit
d9f5ebe
·
verified ·
1 Parent(s): da50574

Training in progress, epoch 1

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4b2dc1373b0762e4448620b59fc90b002c281e6c016750718f64d58c6c68684d
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c05e9f1a309b38835ef1469af45f75649f1181f86c1b5b91a78f0cfb5df3b9d
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2b571377ec2bd4209af616d5e642c15d78a575ca27409d5b6ddb8f44cb321019
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:deb5d9229ec06f79df6eae25f5c8ea69eb5e9282f58fc97012d7c60faf6af6d7
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:558f6d3ae190289391e0049487fed767fd7a1c99e4f8c6f8a1c92f7dce8e77f1
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fec8ea31aa2a8e69566b511aca3bb3e495effe114c81a3d21041d8d32700472d
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1bff831f132d3cf15de84b1b54d5c1ea43045d9acedc8aec81d5641db98971a0
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e65ef19d1ed284fb4d22ea81cef0f8fa888e535bbcea7d6b6487f9625cf0c9b5
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -109,3 +109,114 @@
109
  {"current_steps": 109, "total_steps": 333, "loss": 0.4696, "lr": 0.0001364197561070856, "epoch": 0.9792251544076361, "percentage": 32.73, "elapsed_time": "10:31:35", "remaining_time": "21:37:56"}
110
  {"current_steps": 110, "total_steps": 333, "loss": 0.4775, "lr": 0.00013582072800594284, "epoch": 0.9882088714205502, "percentage": 33.03, "elapsed_time": "10:37:13", "remaining_time": "21:31:49"}
111
  {"current_steps": 111, "total_steps": 333, "loss": 0.4707, "lr": 0.00013521553751920693, "epoch": 0.9971925884334644, "percentage": 33.33, "elapsed_time": "10:43:00", "remaining_time": "21:26:01"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
109
  {"current_steps": 109, "total_steps": 333, "loss": 0.4696, "lr": 0.0001364197561070856, "epoch": 0.9792251544076361, "percentage": 32.73, "elapsed_time": "10:31:35", "remaining_time": "21:37:56"}
110
  {"current_steps": 110, "total_steps": 333, "loss": 0.4775, "lr": 0.00013582072800594284, "epoch": 0.9882088714205502, "percentage": 33.03, "elapsed_time": "10:37:13", "remaining_time": "21:31:49"}
111
  {"current_steps": 111, "total_steps": 333, "loss": 0.4707, "lr": 0.00013521553751920693, "epoch": 0.9971925884334644, "percentage": 33.33, "elapsed_time": "10:43:00", "remaining_time": "21:26:01"}
112
+ {"current_steps": 112, "total_steps": 333, "loss": 0.8319, "lr": 0.00013460425145749236, "epoch": 1.0075800112296462, "percentage": 33.63, "elapsed_time": "10:49:37", "remaining_time": "21:21:51"}
113
+ {"current_steps": 113, "total_steps": 333, "loss": 0.4451, "lr": 0.00013398693730434062, "epoch": 1.0165637282425604, "percentage": 33.93, "elapsed_time": "10:55:24", "remaining_time": "21:16:00"}
114
+ {"current_steps": 114, "total_steps": 333, "loss": 0.448, "lr": 0.00013336366320877062, "epoch": 1.0255474452554745, "percentage": 34.23, "elapsed_time": "11:01:01", "remaining_time": "21:09:50"}
115
+ {"current_steps": 115, "total_steps": 333, "loss": 0.4648, "lr": 0.00013273449797775503, "epoch": 1.0345311622683886, "percentage": 34.53, "elapsed_time": "11:06:42", "remaining_time": "21:03:50"}
116
+ {"current_steps": 116, "total_steps": 333, "loss": 0.4656, "lr": 0.00013209951106862437, "epoch": 1.0435148792813027, "percentage": 34.83, "elapsed_time": "11:12:30", "remaining_time": "20:58:02"}
117
+ {"current_steps": 117, "total_steps": 333, "loss": 0.457, "lr": 0.00013145877258139918, "epoch": 1.0524985962942168, "percentage": 35.14, "elapsed_time": "11:18:10", "remaining_time": "20:52:00"}
118
+ {"current_steps": 118, "total_steps": 333, "loss": 0.465, "lr": 0.0001308123532510513, "epoch": 1.0614823133071307, "percentage": 35.44, "elapsed_time": "11:24:04", "remaining_time": "20:46:23"}
119
+ {"current_steps": 119, "total_steps": 333, "loss": 0.4457, "lr": 0.00013016032443969493, "epoch": 1.0704660303200448, "percentage": 35.74, "elapsed_time": "11:29:37", "remaining_time": "20:40:09"}
120
+ {"current_steps": 120, "total_steps": 333, "loss": 0.4472, "lr": 0.0001295027581287087, "epoch": 1.079449747332959, "percentage": 36.04, "elapsed_time": "11:35:01", "remaining_time": "20:33:39"}
121
+ {"current_steps": 121, "total_steps": 333, "loss": 0.4509, "lr": 0.00012883972691078892, "epoch": 1.088433464345873, "percentage": 36.34, "elapsed_time": "11:40:50", "remaining_time": "20:27:55"}
122
+ {"current_steps": 122, "total_steps": 333, "loss": 0.4389, "lr": 0.00012817130398193595, "epoch": 1.0974171813587872, "percentage": 36.64, "elapsed_time": "11:46:47", "remaining_time": "20:22:23"}
123
+ {"current_steps": 123, "total_steps": 333, "loss": 0.4552, "lr": 0.00012749756313337353, "epoch": 1.1064008983717013, "percentage": 36.94, "elapsed_time": "11:52:28", "remaining_time": "20:16:25"}
124
+ {"current_steps": 124, "total_steps": 333, "loss": 0.431, "lr": 0.00012681857874340235, "epoch": 1.1153846153846154, "percentage": 37.24, "elapsed_time": "11:58:14", "remaining_time": "20:10:35"}
125
+ {"current_steps": 125, "total_steps": 333, "loss": 0.4577, "lr": 0.0001261344257691894, "epoch": 1.1243683323975295, "percentage": 37.54, "elapsed_time": "12:03:51", "remaining_time": "20:04:29"}
126
+ {"current_steps": 126, "total_steps": 333, "loss": 0.4267, "lr": 0.00012544517973849247, "epoch": 1.1333520494104437, "percentage": 37.84, "elapsed_time": "12:09:27", "remaining_time": "19:58:23"}
127
+ {"current_steps": 127, "total_steps": 333, "loss": 0.4422, "lr": 0.00012475091674132266, "epoch": 1.1423357664233578, "percentage": 38.14, "elapsed_time": "12:15:09", "remaining_time": "19:52:28"}
128
+ {"current_steps": 128, "total_steps": 333, "loss": 0.431, "lr": 0.00012405171342154409, "epoch": 1.1513194834362717, "percentage": 38.44, "elapsed_time": "12:20:58", "remaining_time": "19:46:43"}
129
+ {"current_steps": 129, "total_steps": 333, "loss": 0.4439, "lr": 0.00012334764696841273, "epoch": 1.1603032004491858, "percentage": 38.74, "elapsed_time": "12:26:42", "remaining_time": "19:40:50"}
130
+ {"current_steps": 130, "total_steps": 333, "loss": 0.4351, "lr": 0.0001226387951080551, "epoch": 1.1692869174621, "percentage": 39.04, "elapsed_time": "12:32:31", "remaining_time": "19:35:05"}
131
+ {"current_steps": 131, "total_steps": 333, "loss": 0.4355, "lr": 0.0001219252360948876, "epoch": 1.178270634475014, "percentage": 39.34, "elapsed_time": "12:38:23", "remaining_time": "19:29:25"}
132
+ {"current_steps": 132, "total_steps": 333, "loss": 0.4339, "lr": 0.00012120704870297748, "epoch": 1.1872543514879281, "percentage": 39.64, "elapsed_time": "12:44:15", "remaining_time": "19:23:46"}
133
+ {"current_steps": 133, "total_steps": 333, "loss": 0.4342, "lr": 0.00012048431221734653, "epoch": 1.1962380685008422, "percentage": 39.94, "elapsed_time": "12:50:06", "remaining_time": "19:18:03"}
134
+ {"current_steps": 134, "total_steps": 333, "loss": 0.4296, "lr": 0.00011975710642521837, "epoch": 1.2052217855137564, "percentage": 40.24, "elapsed_time": "12:55:47", "remaining_time": "19:12:07"}
135
+ {"current_steps": 135, "total_steps": 333, "loss": 0.4305, "lr": 0.0001190255116072102, "epoch": 1.2142055025266705, "percentage": 40.54, "elapsed_time": "13:01:22", "remaining_time": "19:06:01"}
136
+ {"current_steps": 136, "total_steps": 333, "loss": 0.4302, "lr": 0.00011828960852847013, "epoch": 1.2231892195395846, "percentage": 40.84, "elapsed_time": "13:06:58", "remaining_time": "18:59:58"}
137
+ {"current_steps": 137, "total_steps": 333, "loss": 0.4336, "lr": 0.00011754947842976111, "epoch": 1.2321729365524985, "percentage": 41.14, "elapsed_time": "13:12:27", "remaining_time": "18:53:44"}
138
+ {"current_steps": 138, "total_steps": 333, "loss": 0.4306, "lr": 0.00011680520301849219, "epoch": 1.2411566535654126, "percentage": 41.44, "elapsed_time": "13:18:05", "remaining_time": "18:47:44"}
139
+ {"current_steps": 139, "total_steps": 333, "loss": 0.4303, "lr": 0.00011605686445969838, "epoch": 1.2501403705783267, "percentage": 41.74, "elapsed_time": "13:23:58", "remaining_time": "18:42:06"}
140
+ {"current_steps": 140, "total_steps": 333, "loss": 0.429, "lr": 0.00011530454536697001, "epoch": 1.2591240875912408, "percentage": 42.04, "elapsed_time": "13:29:34", "remaining_time": "18:36:03"}
141
+ {"current_steps": 141, "total_steps": 333, "loss": 0.4311, "lr": 0.00011454832879333245, "epoch": 1.268107804604155, "percentage": 42.34, "elapsed_time": "13:35:16", "remaining_time": "18:30:09"}
142
+ {"current_steps": 142, "total_steps": 333, "loss": 0.4281, "lr": 0.00011378829822207734, "epoch": 1.277091521617069, "percentage": 42.64, "elapsed_time": "13:41:22", "remaining_time": "18:24:48"}
143
+ {"current_steps": 143, "total_steps": 333, "loss": 0.4303, "lr": 0.00011302453755754653, "epoch": 1.2860752386299832, "percentage": 42.94, "elapsed_time": "13:46:49", "remaining_time": "18:18:35"}
144
+ {"current_steps": 144, "total_steps": 333, "loss": 0.4354, "lr": 0.00011225713111586919, "epoch": 1.2950589556428973, "percentage": 43.24, "elapsed_time": "13:52:38", "remaining_time": "18:12:49"}
145
+ {"current_steps": 145, "total_steps": 333, "loss": 0.4176, "lr": 0.00011148616361565386, "epoch": 1.3040426726558114, "percentage": 43.54, "elapsed_time": "13:58:25", "remaining_time": "18:07:03"}
146
+ {"current_steps": 146, "total_steps": 333, "loss": 0.4299, "lr": 0.00011071172016863557, "epoch": 1.3130263896687255, "percentage": 43.84, "elapsed_time": "14:04:26", "remaining_time": "18:01:34"}
147
+ {"current_steps": 147, "total_steps": 333, "loss": 0.4304, "lr": 0.00010993388627028018, "epoch": 1.3220101066816397, "percentage": 44.14, "elapsed_time": "14:10:09", "remaining_time": "17:55:43"}
148
+ {"current_steps": 148, "total_steps": 333, "loss": 0.4332, "lr": 0.0001091527477903457, "epoch": 1.3309938236945535, "percentage": 44.44, "elapsed_time": "14:16:10", "remaining_time": "17:50:12"}
149
+ {"current_steps": 149, "total_steps": 333, "loss": 0.4209, "lr": 0.00010836839096340285, "epoch": 1.3399775407074677, "percentage": 44.74, "elapsed_time": "14:22:18", "remaining_time": "17:44:51"}
150
+ {"current_steps": 150, "total_steps": 333, "loss": 0.4283, "lr": 0.00010758090237931497, "epoch": 1.3489612577203818, "percentage": 45.05, "elapsed_time": "14:28:14", "remaining_time": "17:39:15"}
151
+ {"current_steps": 151, "total_steps": 333, "loss": 0.4263, "lr": 0.0001067903689736789, "epoch": 1.357944974733296, "percentage": 45.35, "elapsed_time": "14:33:58", "remaining_time": "17:33:23"}
152
+ {"current_steps": 152, "total_steps": 333, "loss": 0.4141, "lr": 0.00010599687801822763, "epoch": 1.36692869174621, "percentage": 45.65, "elapsed_time": "14:39:36", "remaining_time": "17:27:26"}
153
+ {"current_steps": 153, "total_steps": 333, "loss": 0.4202, "lr": 0.00010520051711119585, "epoch": 1.3759124087591241, "percentage": 45.95, "elapsed_time": "14:45:18", "remaining_time": "17:21:32"}
154
+ {"current_steps": 154, "total_steps": 333, "loss": 0.4227, "lr": 0.00010440137416764941, "epoch": 1.3848961257720382, "percentage": 46.25, "elapsed_time": "14:51:00", "remaining_time": "17:15:39"}
155
+ {"current_steps": 155, "total_steps": 333, "loss": 0.4163, "lr": 0.00010359953740977998, "epoch": 1.3938798427849521, "percentage": 46.55, "elapsed_time": "14:56:44", "remaining_time": "17:09:47"}
156
+ {"current_steps": 156, "total_steps": 333, "loss": 0.4141, "lr": 0.00010279509535716549, "epoch": 1.4028635597978663, "percentage": 46.85, "elapsed_time": "15:02:27", "remaining_time": "17:03:56"}
157
+ {"current_steps": 157, "total_steps": 333, "loss": 0.4276, "lr": 0.00010198813681699804, "epoch": 1.4118472768107804, "percentage": 47.15, "elapsed_time": "15:08:21", "remaining_time": "16:58:17"}
158
+ {"current_steps": 158, "total_steps": 333, "loss": 0.4168, "lr": 0.00010117875087427998, "epoch": 1.4208309938236945, "percentage": 47.45, "elapsed_time": "15:14:13", "remaining_time": "16:52:35"}
159
+ {"current_steps": 159, "total_steps": 333, "loss": 0.4309, "lr": 0.00010036702688198906, "epoch": 1.4298147108366086, "percentage": 47.75, "elapsed_time": "15:19:59", "remaining_time": "16:46:47"}
160
+ {"current_steps": 160, "total_steps": 333, "loss": 0.4269, "lr": 9.955305445121455e-05, "epoch": 1.4387984278495227, "percentage": 48.05, "elapsed_time": "15:25:46", "remaining_time": "16:40:59"}
161
+ {"current_steps": 161, "total_steps": 333, "loss": 0.4284, "lr": 9.87369234412642e-05, "epoch": 1.4477821448624368, "percentage": 48.35, "elapsed_time": "15:31:37", "remaining_time": "16:35:16"}
162
+ {"current_steps": 162, "total_steps": 333, "loss": 0.4333, "lr": 9.79187239497444e-05, "epoch": 1.456765861875351, "percentage": 48.65, "elapsed_time": "15:37:17", "remaining_time": "16:29:22"}
163
+ {"current_steps": 163, "total_steps": 333, "loss": 0.427, "lr": 9.709854630261359e-05, "epoch": 1.465749578888265, "percentage": 48.95, "elapsed_time": "15:43:14", "remaining_time": "16:23:44"}
164
+ {"current_steps": 164, "total_steps": 333, "loss": 0.4221, "lr": 9.627648104421073e-05, "epoch": 1.4747332959011792, "percentage": 49.25, "elapsed_time": "15:49:00", "remaining_time": "16:17:56"}
165
+ {"current_steps": 165, "total_steps": 333, "loss": 0.4247, "lr": 9.545261892725947e-05, "epoch": 1.4837170129140933, "percentage": 49.55, "elapsed_time": "15:54:43", "remaining_time": "16:12:04"}
166
+ {"current_steps": 166, "total_steps": 333, "loss": 0.4202, "lr": 9.462705090284956e-05, "epoch": 1.4927007299270074, "percentage": 49.85, "elapsed_time": "16:00:18", "remaining_time": "16:06:05"}
167
+ {"current_steps": 167, "total_steps": 333, "loss": 0.4271, "lr": 9.379986811039604e-05, "epoch": 1.5016844469399215, "percentage": 50.15, "elapsed_time": "16:05:59", "remaining_time": "16:00:11"}
168
+ {"current_steps": 168, "total_steps": 333, "loss": 0.4289, "lr": 9.297116186757798e-05, "epoch": 1.5106681639528357, "percentage": 50.45, "elapsed_time": "16:11:36", "remaining_time": "15:54:15"}
169
+ {"current_steps": 169, "total_steps": 333, "loss": 0.4186, "lr": 9.214102366025724e-05, "epoch": 1.5196518809657495, "percentage": 50.75, "elapsed_time": "16:17:23", "remaining_time": "15:48:28"}
170
+ {"current_steps": 170, "total_steps": 333, "loss": 0.4295, "lr": 9.130954513237883e-05, "epoch": 1.5286355979786637, "percentage": 51.05, "elapsed_time": "16:23:23", "remaining_time": "15:42:54"}
171
+ {"current_steps": 171, "total_steps": 333, "loss": 0.4238, "lr": 9.047681807585381e-05, "epoch": 1.5376193149915778, "percentage": 51.35, "elapsed_time": "16:29:02", "remaining_time": "15:36:58"}
172
+ {"current_steps": 172, "total_steps": 333, "loss": 0.427, "lr": 8.964293442042585e-05, "epoch": 1.546603032004492, "percentage": 51.65, "elapsed_time": "16:34:51", "remaining_time": "15:31:14"}
173
+ {"current_steps": 173, "total_steps": 333, "loss": 0.4221, "lr": 8.880798622352253e-05, "epoch": 1.5555867490174058, "percentage": 51.95, "elapsed_time": "16:40:43", "remaining_time": "15:25:31"}
174
+ {"current_steps": 174, "total_steps": 333, "loss": 0.4157, "lr": 8.797206566009252e-05, "epoch": 1.56457046603032, "percentage": 52.25, "elapsed_time": "16:46:37", "remaining_time": "15:19:50"}
175
+ {"current_steps": 175, "total_steps": 333, "loss": 0.4287, "lr": 8.713526501242991e-05, "epoch": 1.573554183043234, "percentage": 52.55, "elapsed_time": "16:52:17", "remaining_time": "15:13:57"}
176
+ {"current_steps": 176, "total_steps": 333, "loss": 0.428, "lr": 8.629767665998652e-05, "epoch": 1.5825379000561481, "percentage": 52.85, "elapsed_time": "16:58:13", "remaining_time": "15:08:18"}
177
+ {"current_steps": 177, "total_steps": 333, "loss": 0.419, "lr": 8.54593930691737e-05, "epoch": 1.5915216170690623, "percentage": 53.15, "elapsed_time": "17:04:01", "remaining_time": "15:02:32"}
178
+ {"current_steps": 178, "total_steps": 333, "loss": 0.4149, "lr": 8.462050678315429e-05, "epoch": 1.6005053340819764, "percentage": 53.45, "elapsed_time": "17:09:49", "remaining_time": "14:56:45"}
179
+ {"current_steps": 179, "total_steps": 333, "loss": 0.4229, "lr": 8.37811104116263e-05, "epoch": 1.6094890510948905, "percentage": 53.75, "elapsed_time": "17:15:32", "remaining_time": "14:50:54"}
180
+ {"current_steps": 180, "total_steps": 333, "loss": 0.4203, "lr": 8.294129662059918e-05, "epoch": 1.6184727681078046, "percentage": 54.05, "elapsed_time": "17:20:57", "remaining_time": "14:44:48"}
181
+ {"current_steps": 181, "total_steps": 333, "loss": 0.4236, "lr": 8.210115812216378e-05, "epoch": 1.6274564851207187, "percentage": 54.35, "elapsed_time": "17:26:45", "remaining_time": "14:39:02"}
182
+ {"current_steps": 182, "total_steps": 333, "loss": 0.4168, "lr": 8.126078766425732e-05, "epoch": 1.6364402021336328, "percentage": 54.65, "elapsed_time": "17:32:12", "remaining_time": "14:32:59"}
183
+ {"current_steps": 183, "total_steps": 333, "loss": 0.4112, "lr": 8.04202780204245e-05, "epoch": 1.645423919146547, "percentage": 54.95, "elapsed_time": "17:37:59", "remaining_time": "14:27:12"}
184
+ {"current_steps": 184, "total_steps": 333, "loss": 0.4119, "lr": 7.957972197957554e-05, "epoch": 1.654407636159461, "percentage": 55.26, "elapsed_time": "17:43:43", "remaining_time": "14:21:23"}
185
+ {"current_steps": 185, "total_steps": 333, "loss": 0.4208, "lr": 7.87392123357427e-05, "epoch": 1.6633913531723752, "percentage": 55.56, "elapsed_time": "17:49:34", "remaining_time": "14:15:39"}
186
+ {"current_steps": 186, "total_steps": 333, "loss": 0.4199, "lr": 7.789884187783625e-05, "epoch": 1.6723750701852893, "percentage": 55.86, "elapsed_time": "17:55:21", "remaining_time": "14:09:52"}
187
+ {"current_steps": 187, "total_steps": 333, "loss": 0.419, "lr": 7.705870337940085e-05, "epoch": 1.6813587871982034, "percentage": 56.16, "elapsed_time": "18:01:10", "remaining_time": "14:04:07"}
188
+ {"current_steps": 188, "total_steps": 333, "loss": 0.4156, "lr": 7.621888958837372e-05, "epoch": 1.6903425042111173, "percentage": 56.46, "elapsed_time": "18:07:23", "remaining_time": "13:58:41"}
189
+ {"current_steps": 189, "total_steps": 333, "loss": 0.4227, "lr": 7.537949321684574e-05, "epoch": 1.6993262212240314, "percentage": 56.76, "elapsed_time": "18:13:04", "remaining_time": "13:52:49"}
190
+ {"current_steps": 190, "total_steps": 333, "loss": 0.4128, "lr": 7.454060693082634e-05, "epoch": 1.7083099382369455, "percentage": 57.06, "elapsed_time": "18:18:47", "remaining_time": "13:46:58"}
191
+ {"current_steps": 191, "total_steps": 333, "loss": 0.4225, "lr": 7.37023233400135e-05, "epoch": 1.7172936552498597, "percentage": 57.36, "elapsed_time": "18:24:49", "remaining_time": "13:41:22"}
192
+ {"current_steps": 192, "total_steps": 333, "loss": 0.4224, "lr": 7.286473498757011e-05, "epoch": 1.7262773722627736, "percentage": 57.66, "elapsed_time": "18:30:47", "remaining_time": "13:35:44"}
193
+ {"current_steps": 193, "total_steps": 333, "loss": 0.4222, "lr": 7.20279343399075e-05, "epoch": 1.7352610892756877, "percentage": 57.96, "elapsed_time": "18:36:51", "remaining_time": "13:30:09"}
194
+ {"current_steps": 194, "total_steps": 333, "loss": 0.4131, "lr": 7.11920137764775e-05, "epoch": 1.7442448062886018, "percentage": 58.26, "elapsed_time": "18:42:46", "remaining_time": "13:24:28"}
195
+ {"current_steps": 195, "total_steps": 333, "loss": 0.4234, "lr": 7.035706557957416e-05, "epoch": 1.753228523301516, "percentage": 58.56, "elapsed_time": "18:48:37", "remaining_time": "13:18:43"}
196
+ {"current_steps": 196, "total_steps": 333, "loss": 0.4274, "lr": 6.952318192414623e-05, "epoch": 1.76221224031443, "percentage": 58.86, "elapsed_time": "18:54:24", "remaining_time": "13:12:56"}
197
+ {"current_steps": 197, "total_steps": 333, "loss": 0.4138, "lr": 6.869045486762122e-05, "epoch": 1.7711959573273441, "percentage": 59.16, "elapsed_time": "19:00:06", "remaining_time": "13:07:04"}
198
+ {"current_steps": 198, "total_steps": 333, "loss": 0.4073, "lr": 6.78589763397428e-05, "epoch": 1.7801796743402583, "percentage": 59.46, "elapsed_time": "19:05:54", "remaining_time": "13:01:18"}
199
+ {"current_steps": 199, "total_steps": 333, "loss": 0.4113, "lr": 6.702883813242205e-05, "epoch": 1.7891633913531724, "percentage": 59.76, "elapsed_time": "19:11:52", "remaining_time": "12:55:38"}
200
+ {"current_steps": 200, "total_steps": 333, "loss": 0.4129, "lr": 6.620013188960398e-05, "epoch": 1.7981471083660865, "percentage": 60.06, "elapsed_time": "19:17:37", "remaining_time": "12:49:49"}
201
+ {"current_steps": 201, "total_steps": 333, "loss": 0.4163, "lr": 6.537294909715048e-05, "epoch": 1.8071308253790006, "percentage": 60.36, "elapsed_time": "19:23:26", "remaining_time": "12:44:03"}
202
+ {"current_steps": 202, "total_steps": 333, "loss": 0.4292, "lr": 6.454738107274056e-05, "epoch": 1.8161145423919147, "percentage": 60.66, "elapsed_time": "19:29:18", "remaining_time": "12:38:18"}
203
+ {"current_steps": 203, "total_steps": 333, "loss": 0.4134, "lr": 6.372351895578931e-05, "epoch": 1.8250982594048288, "percentage": 60.96, "elapsed_time": "19:35:08", "remaining_time": "12:32:33"}
204
+ {"current_steps": 204, "total_steps": 333, "loss": 0.4078, "lr": 6.290145369738644e-05, "epoch": 1.834081976417743, "percentage": 61.26, "elapsed_time": "19:40:59", "remaining_time": "12:26:47"}
205
+ {"current_steps": 205, "total_steps": 333, "loss": 0.4193, "lr": 6.208127605025564e-05, "epoch": 1.843065693430657, "percentage": 61.56, "elapsed_time": "19:46:49", "remaining_time": "12:21:02"}
206
+ {"current_steps": 206, "total_steps": 333, "loss": 0.4076, "lr": 6.126307655873584e-05, "epoch": 1.8520494104435712, "percentage": 61.86, "elapsed_time": "19:52:28", "remaining_time": "12:15:10"}
207
+ {"current_steps": 207, "total_steps": 333, "loss": 0.4151, "lr": 6.0446945548785506e-05, "epoch": 1.861033127456485, "percentage": 62.16, "elapsed_time": "19:58:21", "remaining_time": "12:09:26"}
208
+ {"current_steps": 208, "total_steps": 333, "loss": 0.4248, "lr": 5.9632973118010964e-05, "epoch": 1.8700168444693992, "percentage": 62.46, "elapsed_time": "20:03:59", "remaining_time": "12:03:33"}
209
+ {"current_steps": 209, "total_steps": 333, "loss": 0.4125, "lr": 5.882124912572005e-05, "epoch": 1.8790005614823133, "percentage": 62.76, "elapsed_time": "20:09:45", "remaining_time": "11:57:45"}
210
+ {"current_steps": 210, "total_steps": 333, "loss": 0.4122, "lr": 5.801186318300195e-05, "epoch": 1.8879842784952274, "percentage": 63.06, "elapsed_time": "20:15:29", "remaining_time": "11:51:55"}
211
+ {"current_steps": 211, "total_steps": 333, "loss": 0.4124, "lr": 5.720490464283452e-05, "epoch": 1.8969679955081415, "percentage": 63.36, "elapsed_time": "20:21:15", "remaining_time": "11:46:07"}
212
+ {"current_steps": 212, "total_steps": 333, "loss": 0.4213, "lr": 5.6400462590220024e-05, "epoch": 1.9059517125210554, "percentage": 63.66, "elapsed_time": "20:27:21", "remaining_time": "11:40:31"}
213
+ {"current_steps": 213, "total_steps": 333, "loss": 0.4032, "lr": 5.559862583235059e-05, "epoch": 1.9149354295339696, "percentage": 63.96, "elapsed_time": "20:33:13", "remaining_time": "11:34:46"}
214
+ {"current_steps": 214, "total_steps": 333, "loss": 0.4214, "lr": 5.4799482888804174e-05, "epoch": 1.9239191465468837, "percentage": 64.26, "elapsed_time": "20:39:01", "remaining_time": "11:28:59"}
215
+ {"current_steps": 215, "total_steps": 333, "loss": 0.4116, "lr": 5.400312198177239e-05, "epoch": 1.9329028635597978, "percentage": 64.56, "elapsed_time": "20:44:48", "remaining_time": "11:23:11"}
216
+ {"current_steps": 216, "total_steps": 333, "loss": 0.4153, "lr": 5.320963102632111e-05, "epoch": 1.941886580572712, "percentage": 64.86, "elapsed_time": "20:50:21", "remaining_time": "11:17:16"}
217
+ {"current_steps": 217, "total_steps": 333, "loss": 0.4047, "lr": 5.2419097620685035e-05, "epoch": 1.950870297585626, "percentage": 65.17, "elapsed_time": "20:56:09", "remaining_time": "11:11:29"}
218
+ {"current_steps": 218, "total_steps": 333, "loss": 0.4234, "lr": 5.163160903659715e-05, "epoch": 1.9598540145985401, "percentage": 65.47, "elapsed_time": "21:01:58", "remaining_time": "11:05:43"}
219
+ {"current_steps": 219, "total_steps": 333, "loss": 0.4143, "lr": 5.08472522096543e-05, "epoch": 1.9688377316114543, "percentage": 65.77, "elapsed_time": "21:07:37", "remaining_time": "10:59:51"}
220
+ {"current_steps": 220, "total_steps": 333, "loss": 0.4106, "lr": 5.006611372971982e-05, "epoch": 1.9778214486243684, "percentage": 66.07, "elapsed_time": "21:13:25", "remaining_time": "10:54:04"}
221
+ {"current_steps": 221, "total_steps": 333, "loss": 0.3995, "lr": 4.928827983136444e-05, "epoch": 1.9868051656372825, "percentage": 66.37, "elapsed_time": "21:18:56", "remaining_time": "10:48:09"}
222
+ {"current_steps": 222, "total_steps": 333, "loss": 0.4229, "lr": 4.8513836384346175e-05, "epoch": 1.9957888826501966, "percentage": 66.67, "elapsed_time": "21:24:56", "remaining_time": "10:42:28"}