Dr. Jorge Abreu Vicente committed on
Commit
50526a5
·
1 Parent(s): 2bfe9b0

Training in progress, step 2000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f8e0e79a7a83f8d6c5da3c1219d679a9f73e1a64f33535e1427c8b07d4efdcdd
3
  size 861965029
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63ed17cd5d69cfd14c439f9208e26666e5049a5f7c6be3ea47b308ff26c93cfa
3
  size 861965029
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1b54d1db48c390e2aa766827b4b778f34a81d18da384628bd6055b79f0089620
3
  size 431008241
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c32fa027261aa6406a0aa449c9993ac247bcab32a17c256ade795f1069197b67
3
  size 431008241
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6fa55671a3580107240d729cd7668202e19cfe9ced85cf63192c87c239366db8
3
  size 17563
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c0dcd6c769303cf359205c8d5160a859bbff9b742235db157eca3f13a64b6e5
3
  size 17563
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bcddb40dc24b0f5884040379936f3e8e69d7789af11443275c0d7c46029c5402
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9962220360679d8e10cf7e904b5520efefc5b243afdd605a267181a14c7f58b0
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 0.7458701475198578,
3
- "best_model_checkpoint": "./tokcl_models/EMBO_bert-base-cased_NER-task/checkpoint-1000",
4
- "epoch": 1.310615989515072,
5
- "global_step": 1000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -138,11 +138,143 @@
138
  "eval_samples_per_second": 123.99,
139
  "eval_steps_per_second": 0.97,
140
  "step": 1000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
141
  }
142
  ],
143
  "max_steps": 3815,
144
  "num_train_epochs": 5,
145
- "total_flos": 1.139953338400401e+16,
146
  "trial_name": null,
147
  "trial_params": null
148
  }
 
1
  {
2
+ "best_metric": 0.771723286444866,
3
+ "best_model_checkpoint": "./tokcl_models/EMBO_bert-base-cased_NER-task/checkpoint-2000",
4
+ "epoch": 2.621231979030144,
5
+ "global_step": 2000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
138
  "eval_samples_per_second": 123.99,
139
  "eval_steps_per_second": 0.97,
140
  "step": 1000
141
+ },
142
+ {
143
+ "epoch": 1.38,
144
+ "learning_rate": 0.00036238532110091746,
145
+ "loss": 0.1825,
146
+ "step": 1050
147
+ },
148
+ {
149
+ "epoch": 1.44,
150
+ "learning_rate": 0.0003558322411533421,
151
+ "loss": 0.1898,
152
+ "step": 1100
153
+ },
154
+ {
155
+ "epoch": 1.51,
156
+ "learning_rate": 0.0003492791612057667,
157
+ "loss": 0.1858,
158
+ "step": 1150
159
+ },
160
+ {
161
+ "epoch": 1.57,
162
+ "learning_rate": 0.0003427260812581914,
163
+ "loss": 0.182,
164
+ "step": 1200
165
+ },
166
+ {
167
+ "epoch": 1.64,
168
+ "learning_rate": 0.000336173001310616,
169
+ "loss": 0.1853,
170
+ "step": 1250
171
+ },
172
+ {
173
+ "epoch": 1.7,
174
+ "learning_rate": 0.0003296199213630406,
175
+ "loss": 0.1869,
176
+ "step": 1300
177
+ },
178
+ {
179
+ "epoch": 1.77,
180
+ "learning_rate": 0.0003230668414154653,
181
+ "loss": 0.1771,
182
+ "step": 1350
183
+ },
184
+ {
185
+ "epoch": 1.83,
186
+ "learning_rate": 0.0003165137614678899,
187
+ "loss": 0.1759,
188
+ "step": 1400
189
+ },
190
+ {
191
+ "epoch": 1.9,
192
+ "learning_rate": 0.00030996068152031454,
193
+ "loss": 0.1705,
194
+ "step": 1450
195
+ },
196
+ {
197
+ "epoch": 1.97,
198
+ "learning_rate": 0.00030340760157273916,
199
+ "loss": 0.1786,
200
+ "step": 1500
201
+ },
202
+ {
203
+ "epoch": 2.03,
204
+ "learning_rate": 0.00029685452162516384,
205
+ "loss": 0.1589,
206
+ "step": 1550
207
+ },
208
+ {
209
+ "epoch": 2.1,
210
+ "learning_rate": 0.00029030144167758846,
211
+ "loss": 0.1364,
212
+ "step": 1600
213
+ },
214
+ {
215
+ "epoch": 2.16,
216
+ "learning_rate": 0.00028374836173001314,
217
+ "loss": 0.1319,
218
+ "step": 1650
219
+ },
220
+ {
221
+ "epoch": 2.23,
222
+ "learning_rate": 0.00027719528178243776,
223
+ "loss": 0.1283,
224
+ "step": 1700
225
+ },
226
+ {
227
+ "epoch": 2.29,
228
+ "learning_rate": 0.0002706422018348624,
229
+ "loss": 0.1266,
230
+ "step": 1750
231
+ },
232
+ {
233
+ "epoch": 2.36,
234
+ "learning_rate": 0.000264089121887287,
235
+ "loss": 0.1359,
236
+ "step": 1800
237
+ },
238
+ {
239
+ "epoch": 2.42,
240
+ "learning_rate": 0.0002575360419397117,
241
+ "loss": 0.1271,
242
+ "step": 1850
243
+ },
244
+ {
245
+ "epoch": 2.49,
246
+ "learning_rate": 0.0002509829619921363,
247
+ "loss": 0.1328,
248
+ "step": 1900
249
+ },
250
+ {
251
+ "epoch": 2.56,
252
+ "learning_rate": 0.000244429882044561,
253
+ "loss": 0.1328,
254
+ "step": 1950
255
+ },
256
+ {
257
+ "epoch": 2.62,
258
+ "learning_rate": 0.0002378768020969856,
259
+ "loss": 0.138,
260
+ "step": 2000
261
+ },
262
+ {
263
+ "epoch": 2.62,
264
+ "eval_accuracy_score": 0.9121489075478695,
265
+ "eval_f1": 0.771723286444866,
266
+ "eval_loss": 0.2743813991546631,
267
+ "eval_precision": 0.751326535173136,
268
+ "eval_recall": 0.7932583890920736,
269
+ "eval_runtime": 111.6996,
270
+ "eval_samples_per_second": 123.555,
271
+ "eval_steps_per_second": 0.967,
272
+ "step": 2000
273
  }
274
  ],
275
  "max_steps": 3815,
276
  "num_train_epochs": 5,
277
+ "total_flos": 2.283293725774362e+16,
278
  "trial_name": null,
279
  "trial_params": null
280
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1b54d1db48c390e2aa766827b4b778f34a81d18da384628bd6055b79f0089620
3
  size 431008241
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c32fa027261aa6406a0aa449c9993ac247bcab32a17c256ade795f1069197b67
3
  size 431008241
runs/May20_12-43-43_9288e76c4417/events.out.tfevents.1653050648.9288e76c4417.830.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:83cbcf1822635c478dede77180c40bf9aa26892caa42abaf69351c9324581801
3
- size 7785
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63372c2b6f1aa18b43dd0c330803479732d2191a9edc3b644cf43dcc964e1c5a
3
+ size 11403