ShengdingHu commited on
Commit
fff6232
·
1 Parent(s): e5b0b79

Training in progress, step 200

Browse files
all_results.json CHANGED
@@ -1,20 +1,20 @@
1
  {
2
  "epoch": 3.0,
3
- "eval_average_metrics": 90.63138686131387,
4
- "eval_em": 90.36496350364963,
5
- "eval_f1": 90.89781021897811,
6
- "eval_loss": 0.2141435146331787,
7
- "eval_runtime": 15.7609,
8
- "eval_samples_per_second": 86.924,
9
- "test_average_metrics": 74.47490712152019,
10
- "test_em": 73.99182920400632,
11
- "test_f1": 74.95798503903406,
12
- "test_loss": 0.48021578788757324,
13
- "test_runtime": 161.768,
14
- "test_samples_per_second": 93.813,
15
- "train_loss": 0.3297047741756515,
16
- "train_runtime": 5659.5381,
17
  "train_samples": 137484,
18
- "train_samples_per_second": 72.877,
19
- "train_steps_per_second": 4.555
20
  }
 
1
  {
2
  "epoch": 3.0,
3
+ "eval_average_metrics": 91.36131386861314,
4
+ "eval_em": 91.0948905109489,
5
+ "eval_f1": 91.62773722627739,
6
+ "eval_loss": 0.21504777669906616,
7
+ "eval_runtime": 32.7505,
8
+ "eval_samples_per_second": 41.831,
9
+ "test_average_metrics": 75.00792291086177,
10
+ "test_em": 74.50579862941487,
11
+ "test_f1": 75.51004719230866,
12
+ "test_loss": 0.48300713300704956,
13
+ "test_runtime": 342.8147,
14
+ "test_samples_per_second": 44.269,
15
+ "train_loss": 0.3175360437943145,
16
+ "train_runtime": 17672.1841,
17
  "train_samples": 137484,
18
+ "train_samples_per_second": 23.339,
19
+ "train_steps_per_second": 1.459
20
  }
eval_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "epoch": 3.0,
3
- "eval_average_metrics": 90.63138686131387,
4
- "eval_em": 90.36496350364963,
5
- "eval_f1": 90.89781021897811,
6
- "eval_loss": 0.2141435146331787,
7
- "eval_runtime": 15.7609,
8
- "eval_samples_per_second": 86.924
9
  }
 
1
  {
2
  "epoch": 3.0,
3
+ "eval_average_metrics": 91.36131386861314,
4
+ "eval_em": 91.0948905109489,
5
+ "eval_f1": 91.62773722627739,
6
+ "eval_loss": 0.21504777669906616,
7
+ "eval_runtime": 32.7505,
8
+ "eval_samples_per_second": 41.831
9
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e8ace9158b4ccbc5041040d01c8ebdd84c66838368f240b1990392deb3dd5139
3
- size 7551621
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73bb270c9eb59d9f8a29f0bc108b1a26a26964434e7c8e43708ee7b37a511790
3
+ size 2631685
runs/Feb01_01-41-55_node1/events.out.tfevents.1643651046.node1 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8b890bc2228a1105ec12abd606bd641c665556eb421c44827cc0fb330c331aae
3
- size 58695
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6c57d4a2a5d00b66d8713b9942e1625bfc930480ae2c78809d0534326af5a44
3
+ size 59424
runs/Feb01_01-41-55_node1/events.out.tfevents.1643668752.node1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ee097214c3435788d0149fdfe0d0613c4683aa80f0538d0be9deaedca10c049
3
+ size 778
runs/Feb02_15-54-46_node1/1643788552.5548458/events.out.tfevents.1643788552.node1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:427de076ab994390934567ade01150a3a1e5ba6cd2847dd5851a17cd3d1506af
3
+ size 5047
runs/Feb02_15-54-46_node1/events.out.tfevents.1643788552.node1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84ff116273de9d30f8e85b06aaf6d6da8f411a96c210e7073f295f39f89a946b
3
+ size 4335
test_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "epoch": 3.0,
3
- "test_average_metrics": 74.47490712152019,
4
- "test_em": 73.99182920400632,
5
- "test_f1": 74.95798503903406,
6
- "test_loss": 0.48021578788757324,
7
- "test_runtime": 161.768,
8
- "test_samples_per_second": 93.813
9
  }
 
1
  {
2
  "epoch": 3.0,
3
+ "test_average_metrics": 75.00792291086177,
4
+ "test_em": 74.50579862941487,
5
+ "test_f1": 75.51004719230866,
6
+ "test_loss": 0.48300713300704956,
7
+ "test_runtime": 342.8147,
8
+ "test_samples_per_second": 44.269
9
  }
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 3.0,
3
- "train_loss": 0.3297047741756515,
4
- "train_runtime": 5659.5381,
5
  "train_samples": 137484,
6
- "train_samples_per_second": 72.877,
7
- "train_steps_per_second": 4.555
8
  }
 
1
  {
2
  "epoch": 3.0,
3
+ "train_loss": 0.3175360437943145,
4
+ "train_runtime": 17672.1841,
5
  "train_samples": 137484,
6
+ "train_samples_per_second": 23.339,
7
+ "train_steps_per_second": 1.459
8
  }
trainer_state.json CHANGED
@@ -1,841 +1,1611 @@
1
  {
2
- "best_metric": 90.63138686131387,
3
- "best_model_checkpoint": "outputs/bitfit/t5-base/superglue-record/checkpoint-21500",
4
  "epoch": 3.0,
5
  "global_step": 25779,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
10
  {
11
  "epoch": 0.06,
12
  "learning_rate": 0.0002941813103689049,
13
- "loss": 0.3506,
14
  "step": 500
15
  },
16
  {
17
- "epoch": 0.06,
18
- "eval_average_metrics": 90.1404240528328,
19
- "eval_em": 89.85401459854015,
20
- "eval_f1": 90.42683350712547,
21
- "eval_loss": 0.23184123635292053,
22
- "eval_runtime": 15.5789,
23
- "eval_samples_per_second": 87.939,
24
- "step": 500
 
 
 
 
 
 
 
 
 
 
25
  },
26
  {
27
  "epoch": 0.12,
28
  "learning_rate": 0.0002883626207378098,
29
- "loss": 0.3505,
30
  "step": 1000
31
  },
32
  {
33
  "epoch": 0.12,
34
- "eval_average_metrics": 89.19586374695865,
35
- "eval_em": 88.75912408759125,
36
- "eval_f1": 89.63260340632604,
37
- "eval_loss": 0.2271701991558075,
38
- "eval_runtime": 15.9901,
39
- "eval_samples_per_second": 85.678,
40
  "step": 1000
41
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
42
  {
43
  "epoch": 0.17,
44
  "learning_rate": 0.00028254393110671474,
45
- "loss": 0.3559,
46
  "step": 1500
47
  },
48
  {
49
- "epoch": 0.17,
50
- "eval_average_metrics": 87.68126520681264,
51
- "eval_em": 87.37226277372262,
52
- "eval_f1": 87.99026763990267,
53
- "eval_loss": 0.23542903363704681,
54
- "eval_runtime": 15.5654,
55
- "eval_samples_per_second": 88.016,
56
- "step": 1500
 
 
 
 
 
 
 
 
 
 
57
  },
58
  {
59
  "epoch": 0.23,
60
  "learning_rate": 0.0002767252414756197,
61
- "loss": 0.3487,
62
  "step": 2000
63
  },
64
  {
65
  "epoch": 0.23,
66
- "eval_average_metrics": 88.3946819603754,
67
- "eval_em": 87.95620437956204,
68
- "eval_f1": 88.83315954118875,
69
- "eval_loss": 0.23398332297801971,
70
- "eval_runtime": 15.718,
71
- "eval_samples_per_second": 87.161,
72
  "step": 2000
73
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
74
  {
75
  "epoch": 0.29,
76
  "learning_rate": 0.0002709065518445246,
77
- "loss": 0.3461,
78
  "step": 2500
79
  },
80
  {
81
- "epoch": 0.29,
82
- "eval_average_metrics": 88.34428223844282,
83
- "eval_em": 88.02919708029196,
84
- "eval_f1": 88.65936739659367,
85
- "eval_loss": 0.23554831743240356,
86
- "eval_runtime": 15.4728,
87
- "eval_samples_per_second": 88.542,
88
- "step": 2500
 
 
 
 
 
 
 
 
 
 
89
  },
90
  {
91
  "epoch": 0.35,
92
  "learning_rate": 0.0002650878622134295,
93
- "loss": 0.3514,
94
  "step": 3000
95
  },
96
  {
97
  "epoch": 0.35,
98
- "eval_average_metrics": 88.32290580465764,
99
- "eval_em": 87.88321167883211,
100
- "eval_f1": 88.76259993048315,
101
- "eval_loss": 0.23650217056274414,
102
- "eval_runtime": 15.254,
103
- "eval_samples_per_second": 89.812,
104
  "step": 3000
105
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
106
  {
107
  "epoch": 0.41,
108
  "learning_rate": 0.00025926917258233445,
109
- "loss": 0.3468,
110
  "step": 3500
111
  },
112
  {
113
- "epoch": 0.41,
114
- "eval_average_metrics": 89.25669099756689,
115
- "eval_em": 88.97810218978101,
116
- "eval_f1": 89.53527980535279,
117
- "eval_loss": 0.22920837998390198,
118
- "eval_runtime": 15.3356,
119
- "eval_samples_per_second": 89.335,
120
- "step": 3500
 
 
 
 
 
 
 
 
 
 
121
  },
122
  {
123
  "epoch": 0.47,
124
  "learning_rate": 0.0002534504829512394,
125
- "loss": 0.3428,
126
  "step": 4000
127
  },
128
  {
129
  "epoch": 0.47,
130
- "eval_average_metrics": 88.33211678832117,
131
- "eval_em": 88.02919708029196,
132
- "eval_f1": 88.63503649635038,
133
- "eval_loss": 0.2317986935377121,
134
- "eval_runtime": 15.4226,
135
- "eval_samples_per_second": 88.831,
136
  "step": 4000
137
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
138
  {
139
  "epoch": 0.52,
140
  "learning_rate": 0.0002476317933201443,
141
- "loss": 0.3485,
142
  "step": 4500
143
  },
144
  {
145
- "epoch": 0.52,
146
- "eval_average_metrics": 87.90024330900243,
147
- "eval_em": 87.66423357664233,
148
- "eval_f1": 88.13625304136254,
149
- "eval_loss": 0.23495055735111237,
150
- "eval_runtime": 15.4567,
151
- "eval_samples_per_second": 88.635,
152
- "step": 4500
 
 
 
 
 
 
 
 
 
 
153
  },
154
  {
155
  "epoch": 0.58,
156
  "learning_rate": 0.0002418131036890492,
157
- "loss": 0.3509,
158
  "step": 5000
159
  },
160
  {
161
  "epoch": 0.58,
162
- "eval_average_metrics": 88.830900243309,
163
- "eval_em": 88.61313868613139,
164
- "eval_f1": 89.04866180048661,
165
- "eval_loss": 0.2319142073392868,
166
- "eval_runtime": 15.5322,
167
- "eval_samples_per_second": 88.204,
168
  "step": 5000
169
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
170
  {
171
  "epoch": 0.64,
172
  "learning_rate": 0.0002359944140579541,
173
- "loss": 0.3427,
174
  "step": 5500
175
  },
176
  {
177
- "epoch": 0.64,
178
- "eval_average_metrics": 86.61678832116789,
179
- "eval_em": 86.27737226277372,
180
- "eval_f1": 86.95620437956205,
181
- "eval_loss": 0.2410917580127716,
182
- "eval_runtime": 15.3636,
183
- "eval_samples_per_second": 89.172,
184
- "step": 5500
 
 
 
 
 
 
 
 
 
 
185
  },
186
  {
187
  "epoch": 0.7,
188
  "learning_rate": 0.00023017572442685905,
189
- "loss": 0.349,
190
  "step": 6000
191
  },
192
  {
193
  "epoch": 0.7,
194
- "eval_average_metrics": 88.17570385818561,
195
- "eval_em": 87.8102189781022,
196
- "eval_f1": 88.54118873826903,
197
- "eval_loss": 0.23763984441757202,
198
- "eval_runtime": 15.6242,
199
- "eval_samples_per_second": 87.684,
200
  "step": 6000
201
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
202
  {
203
  "epoch": 0.76,
204
  "learning_rate": 0.00022435703479576396,
205
- "loss": 0.3404,
206
  "step": 6500
207
  },
208
  {
209
- "epoch": 0.76,
210
- "eval_average_metrics": 88.27128953771289,
211
- "eval_em": 88.02919708029196,
212
- "eval_f1": 88.51338199513381,
213
- "eval_loss": 0.23219799995422363,
214
- "eval_runtime": 15.7753,
215
- "eval_samples_per_second": 86.845,
216
- "step": 6500
 
 
 
 
 
 
 
 
 
 
217
  },
218
  {
219
  "epoch": 0.81,
220
  "learning_rate": 0.0002185383451646689,
221
- "loss": 0.3369,
222
  "step": 7000
223
  },
224
  {
225
  "epoch": 0.81,
226
- "eval_average_metrics": 89.59054570733403,
227
- "eval_em": 89.12408759124088,
228
- "eval_f1": 90.05700382342718,
229
- "eval_loss": 0.2249041497707367,
230
- "eval_runtime": 15.3646,
231
- "eval_samples_per_second": 89.166,
232
  "step": 7000
233
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
234
  {
235
  "epoch": 0.87,
236
  "learning_rate": 0.00021271965553357382,
237
- "loss": 0.3348,
238
  "step": 7500
239
  },
240
  {
241
- "epoch": 0.87,
242
- "eval_average_metrics": 89.87104622871047,
243
- "eval_em": 89.56204379562044,
244
- "eval_f1": 90.1800486618005,
245
- "eval_loss": 0.22438949346542358,
246
- "eval_runtime": 15.6922,
247
- "eval_samples_per_second": 87.305,
248
- "step": 7500
 
 
 
 
 
 
 
 
 
 
249
  },
250
  {
251
  "epoch": 0.93,
252
  "learning_rate": 0.00020690096590247876,
253
- "loss": 0.34,
254
  "step": 8000
255
  },
256
  {
257
  "epoch": 0.93,
258
- "eval_average_metrics": 87.99148418491484,
259
- "eval_em": 87.66423357664233,
260
- "eval_f1": 88.31873479318735,
261
- "eval_loss": 0.23190169036388397,
262
- "eval_runtime": 15.0876,
263
- "eval_samples_per_second": 90.803,
264
  "step": 8000
265
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
266
  {
267
  "epoch": 0.99,
268
  "learning_rate": 0.00020108227627138367,
269
- "loss": 0.3413,
270
  "step": 8500
271
  },
272
  {
273
- "epoch": 0.99,
274
- "eval_average_metrics": 89.0498783454988,
275
- "eval_em": 88.75912408759125,
276
- "eval_f1": 89.34063260340633,
277
- "eval_loss": 0.2290135771036148,
278
- "eval_runtime": 15.6237,
279
- "eval_samples_per_second": 87.688,
280
- "step": 8500
 
 
 
 
 
 
 
 
 
 
281
  },
282
  {
283
  "epoch": 1.05,
284
  "learning_rate": 0.00019526358664028858,
285
- "loss": 0.3207,
286
  "step": 9000
287
  },
288
  {
289
  "epoch": 1.05,
290
- "eval_average_metrics": 89.54257907542579,
291
- "eval_em": 89.34306569343066,
292
- "eval_f1": 89.74209245742092,
293
- "eval_loss": 0.22638055682182312,
294
- "eval_runtime": 15.2056,
295
- "eval_samples_per_second": 90.098,
296
  "step": 9000
297
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
298
  {
299
  "epoch": 1.11,
300
  "learning_rate": 0.00018944489700919352,
301
- "loss": 0.333,
302
  "step": 9500
303
  },
304
  {
305
- "epoch": 1.11,
306
- "eval_average_metrics": 89.5912408759124,
307
- "eval_em": 89.34306569343066,
308
- "eval_f1": 89.83941605839416,
309
- "eval_loss": 0.22846655547618866,
310
- "eval_runtime": 15.7388,
311
- "eval_samples_per_second": 87.046,
312
- "step": 9500
 
 
 
 
 
 
 
 
 
 
313
  },
314
  {
315
  "epoch": 1.16,
316
  "learning_rate": 0.00018362620737809844,
317
- "loss": 0.3313,
318
  "step": 10000
319
  },
320
  {
321
  "epoch": 1.16,
322
- "eval_average_metrics": 88.52485227667711,
323
- "eval_em": 88.17518248175182,
324
- "eval_f1": 88.87452207160239,
325
- "eval_loss": 0.23135380446910858,
326
- "eval_runtime": 15.5843,
327
- "eval_samples_per_second": 87.909,
328
  "step": 10000
329
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
330
  {
331
  "epoch": 1.22,
332
  "learning_rate": 0.00017780751774700338,
333
- "loss": 0.3326,
334
  "step": 10500
335
  },
336
  {
337
- "epoch": 1.22,
338
- "eval_average_metrics": 89.61730969760167,
339
- "eval_em": 89.12408759124088,
340
- "eval_f1": 90.11053180396246,
341
- "eval_loss": 0.22540691494941711,
342
- "eval_runtime": 15.4318,
343
- "eval_samples_per_second": 88.777,
344
- "step": 10500
 
 
 
 
 
 
 
 
 
 
345
  },
346
  {
347
  "epoch": 1.28,
348
  "learning_rate": 0.0001719888281159083,
349
- "loss": 0.3349,
350
  "step": 11000
351
  },
352
  {
353
  "epoch": 1.28,
354
- "eval_average_metrics": 88.49808828640946,
355
- "eval_em": 88.17518248175182,
356
- "eval_f1": 88.82099409106708,
357
- "eval_loss": 0.2274966984987259,
358
- "eval_runtime": 15.7884,
359
- "eval_samples_per_second": 86.773,
360
  "step": 11000
361
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
362
  {
363
  "epoch": 1.34,
364
  "learning_rate": 0.00016617013848481323,
365
- "loss": 0.3268,
366
  "step": 11500
367
  },
368
  {
369
- "epoch": 1.34,
370
- "eval_average_metrics": 90.12043795620437,
371
- "eval_em": 89.7080291970803,
372
- "eval_f1": 90.53284671532846,
373
- "eval_loss": 0.22236795723438263,
374
- "eval_runtime": 15.5257,
375
- "eval_samples_per_second": 88.241,
376
- "step": 11500
 
 
 
 
 
 
 
 
 
 
377
  },
378
  {
379
  "epoch": 1.4,
380
  "learning_rate": 0.00016035144885371815,
381
- "loss": 0.3315,
382
  "step": 12000
383
  },
384
  {
385
  "epoch": 1.4,
386
- "eval_average_metrics": 88.9403892944039,
387
- "eval_em": 88.54014598540147,
388
- "eval_f1": 89.34063260340633,
389
- "eval_loss": 0.22285930812358856,
390
- "eval_runtime": 15.103,
391
- "eval_samples_per_second": 90.71,
392
  "step": 12000
393
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
394
  {
395
  "epoch": 1.45,
396
  "learning_rate": 0.00015453275922262303,
397
- "loss": 0.3262,
398
  "step": 12500
399
  },
400
  {
401
- "epoch": 1.45,
402
- "eval_average_metrics": 86.66718804310045,
403
- "eval_em": 86.27737226277372,
404
- "eval_f1": 87.0570038234272,
405
- "eval_loss": 0.23210552334785461,
406
- "eval_runtime": 15.5946,
407
- "eval_samples_per_second": 87.851,
408
- "step": 12500
 
 
 
 
 
 
 
 
 
 
409
  },
410
  {
411
  "epoch": 1.51,
412
  "learning_rate": 0.00014871406959152797,
413
- "loss": 0.3389,
414
  "step": 13000
415
  },
416
  {
417
  "epoch": 1.51,
418
- "eval_average_metrics": 89.97445255474452,
419
- "eval_em": 89.7080291970803,
420
- "eval_f1": 90.24087591240875,
421
- "eval_loss": 0.22476908564567566,
422
- "eval_runtime": 15.3804,
423
- "eval_samples_per_second": 89.075,
424
  "step": 13000
425
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
426
  {
427
  "epoch": 1.57,
428
  "learning_rate": 0.00014289537996043292,
429
- "loss": 0.324,
430
  "step": 13500
431
  },
432
  {
433
- "epoch": 1.57,
434
- "eval_average_metrics": 88.98470629127564,
435
- "eval_em": 88.54014598540147,
436
- "eval_f1": 89.42926659714982,
437
- "eval_loss": 0.22203609347343445,
438
- "eval_runtime": 15.4489,
439
- "eval_samples_per_second": 88.679,
440
- "step": 13500
 
 
 
 
 
 
 
 
 
 
441
  },
442
  {
443
  "epoch": 1.63,
444
  "learning_rate": 0.00013707669032933783,
445
- "loss": 0.327,
446
  "step": 14000
447
  },
448
  {
449
  "epoch": 1.63,
450
- "eval_average_metrics": 89.79370872436566,
451
- "eval_em": 89.41605839416059,
452
- "eval_f1": 90.17135905457073,
453
- "eval_loss": 0.22265847027301788,
454
- "eval_runtime": 15.2397,
455
- "eval_samples_per_second": 89.897,
456
  "step": 14000
457
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
458
  {
459
  "epoch": 1.69,
460
  "learning_rate": 0.00013125800069824274,
461
- "loss": 0.3315,
462
  "step": 14500
463
  },
464
  {
465
- "epoch": 1.69,
466
- "eval_average_metrics": 89.11678832116787,
467
- "eval_em": 88.83211678832117,
468
- "eval_f1": 89.40145985401458,
469
- "eval_loss": 0.22402139008045197,
470
- "eval_runtime": 15.9941,
471
- "eval_samples_per_second": 85.657,
472
- "step": 14500
 
 
 
 
 
 
 
 
 
 
473
  },
474
  {
475
  "epoch": 1.75,
476
  "learning_rate": 0.00012543931106714766,
477
- "loss": 0.3236,
478
  "step": 15000
479
  },
480
  {
481
  "epoch": 1.75,
482
- "eval_average_metrics": 89.00729927007299,
483
- "eval_em": 88.6861313868613,
484
- "eval_f1": 89.32846715328466,
485
- "eval_loss": 0.22223517298698425,
486
- "eval_runtime": 15.5255,
487
- "eval_samples_per_second": 88.242,
488
  "step": 15000
489
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
490
  {
491
  "epoch": 1.8,
492
  "learning_rate": 0.00011962062143605258,
493
- "loss": 0.3214,
494
  "step": 15500
495
  },
496
  {
497
- "epoch": 1.8,
498
- "eval_average_metrics": 88.32603406326032,
499
- "eval_em": 88.02919708029196,
500
- "eval_f1": 88.6228710462287,
501
- "eval_loss": 0.22402779757976532,
502
- "eval_runtime": 15.9032,
503
- "eval_samples_per_second": 86.146,
504
- "step": 15500
 
 
 
 
 
 
 
 
 
 
505
  },
506
  {
507
  "epoch": 1.86,
508
  "learning_rate": 0.00011380193180495751,
509
- "loss": 0.3254,
510
  "step": 16000
511
  },
512
  {
513
  "epoch": 1.86,
514
- "eval_average_metrics": 89.72506082725062,
515
- "eval_em": 89.48905109489051,
516
- "eval_f1": 89.96107055961072,
517
- "eval_loss": 0.21747739613056183,
518
- "eval_runtime": 15.403,
519
- "eval_samples_per_second": 88.944,
520
  "step": 16000
521
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
522
  {
523
  "epoch": 1.92,
524
  "learning_rate": 0.00010798324217386244,
525
- "loss": 0.3216,
526
  "step": 16500
527
  },
528
  {
529
- "epoch": 1.92,
530
- "eval_average_metrics": 90.24209245742091,
531
- "eval_em": 90.0,
532
- "eval_f1": 90.48418491484183,
533
- "eval_loss": 0.21551567316055298,
534
- "eval_runtime": 15.0664,
535
- "eval_samples_per_second": 90.931,
536
- "step": 16500
 
 
 
 
 
 
 
 
 
 
537
  },
538
  {
539
  "epoch": 1.98,
540
  "learning_rate": 0.00010216455254276737,
541
- "loss": 0.327,
542
  "step": 17000
543
  },
544
  {
545
  "epoch": 1.98,
546
- "eval_average_metrics": 89.62773722627736,
547
- "eval_em": 89.34306569343066,
548
- "eval_f1": 89.91240875912406,
549
- "eval_loss": 0.22303573787212372,
550
- "eval_runtime": 15.6955,
551
- "eval_samples_per_second": 87.286,
552
  "step": 17000
553
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
554
  {
555
  "epoch": 2.04,
556
  "learning_rate": 9.634586291167229e-05,
557
- "loss": 0.3216,
558
  "step": 17500
559
  },
560
  {
561
- "epoch": 2.04,
562
- "eval_average_metrics": 89.6581508515815,
563
- "eval_em": 89.34306569343066,
564
- "eval_f1": 89.97323600973235,
565
- "eval_loss": 0.21931786835193634,
566
- "eval_runtime": 16.0777,
567
- "eval_samples_per_second": 85.211,
568
- "step": 17500
 
 
 
 
 
 
 
 
 
 
569
  },
570
  {
571
  "epoch": 2.09,
572
  "learning_rate": 9.052717328057722e-05,
573
- "loss": 0.3166,
574
  "step": 18000
575
  },
576
  {
577
  "epoch": 2.09,
578
- "eval_average_metrics": 88.78397636426834,
579
- "eval_em": 88.39416058394161,
580
- "eval_f1": 89.17379214459508,
581
- "eval_loss": 0.2221771478652954,
582
- "eval_runtime": 15.5735,
583
- "eval_samples_per_second": 87.97,
584
  "step": 18000
585
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
586
  {
587
  "epoch": 2.15,
588
  "learning_rate": 8.470848364948212e-05,
589
- "loss": 0.321,
590
  "step": 18500
591
  },
592
  {
593
- "epoch": 2.15,
594
- "eval_average_metrics": 90.1508515815085,
595
- "eval_em": 89.92700729927007,
596
- "eval_f1": 90.37469586374695,
597
- "eval_loss": 0.2213568538427353,
598
- "eval_runtime": 15.5146,
599
- "eval_samples_per_second": 88.304,
600
- "step": 18500
 
 
 
 
 
 
 
 
 
 
601
  },
602
  {
603
  "epoch": 2.21,
604
  "learning_rate": 7.888979401838705e-05,
605
- "loss": 0.3099,
606
  "step": 19000
607
  },
608
  {
609
  "epoch": 2.21,
610
- "eval_average_metrics": 90.41240875912409,
611
- "eval_em": 90.14598540145985,
612
- "eval_f1": 90.67883211678833,
613
- "eval_loss": 0.21670033037662506,
614
- "eval_runtime": 15.2815,
615
- "eval_samples_per_second": 89.651,
616
  "step": 19000
617
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
618
  {
619
  "epoch": 2.27,
620
  "learning_rate": 7.307110438729197e-05,
621
- "loss": 0.3178,
622
  "step": 19500
623
  },
624
  {
625
- "epoch": 2.27,
626
- "eval_average_metrics": 89.41484184914842,
627
- "eval_em": 89.19708029197079,
628
- "eval_f1": 89.63260340632604,
629
- "eval_loss": 0.21756400167942047,
630
- "eval_runtime": 15.5668,
631
- "eval_samples_per_second": 88.008,
632
- "step": 19500
 
 
 
 
 
 
 
 
 
 
633
  },
634
  {
635
  "epoch": 2.33,
636
  "learning_rate": 6.72524147561969e-05,
637
- "loss": 0.3082,
638
  "step": 20000
639
  },
640
  {
641
  "epoch": 2.33,
642
- "eval_average_metrics": 90.38807785888078,
643
- "eval_em": 90.14598540145985,
644
- "eval_f1": 90.6301703163017,
645
- "eval_loss": 0.213778555393219,
646
- "eval_runtime": 15.3113,
647
- "eval_samples_per_second": 89.476,
648
  "step": 20000
649
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
650
  {
651
  "epoch": 2.39,
652
  "learning_rate": 6.143372512510183e-05,
653
- "loss": 0.3185,
654
  "step": 20500
655
  },
656
  {
657
- "epoch": 2.39,
658
- "eval_average_metrics": 89.44091067083768,
659
- "eval_em": 89.05109489051095,
660
- "eval_f1": 89.83072645116441,
661
- "eval_loss": 0.21920597553253174,
662
- "eval_runtime": 15.0292,
663
- "eval_samples_per_second": 91.156,
664
- "step": 20500
 
 
 
 
 
 
 
 
 
 
665
  },
666
  {
667
  "epoch": 2.44,
668
  "learning_rate": 5.561503549400675e-05,
669
- "loss": 0.3214,
670
  "step": 21000
671
  },
672
  {
673
  "epoch": 2.44,
674
- "eval_average_metrics": 89.58515815085158,
675
- "eval_em": 89.27007299270073,
676
- "eval_f1": 89.90024330900242,
677
- "eval_loss": 0.21777711808681488,
678
- "eval_runtime": 15.5974,
679
- "eval_samples_per_second": 87.835,
680
  "step": 21000
681
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
682
  {
683
  "epoch": 2.5,
684
  "learning_rate": 4.9796345862911663e-05,
685
- "loss": 0.3204,
686
  "step": 21500
687
  },
688
  {
689
- "epoch": 2.5,
690
- "eval_average_metrics": 90.63138686131387,
691
- "eval_em": 90.36496350364963,
692
- "eval_f1": 90.89781021897811,
693
- "eval_loss": 0.2141435146331787,
694
- "eval_runtime": 15.7201,
695
- "eval_samples_per_second": 87.149,
696
- "step": 21500
 
 
 
 
 
 
 
 
 
 
697
  },
698
  {
699
  "epoch": 2.56,
700
  "learning_rate": 4.397765623181659e-05,
701
- "loss": 0.3219,
702
  "step": 22000
703
  },
704
  {
705
  "epoch": 2.56,
706
- "eval_average_metrics": 89.92579075425792,
707
- "eval_em": 89.56204379562044,
708
- "eval_f1": 90.28953771289538,
709
- "eval_loss": 0.21593248844146729,
710
- "eval_runtime": 15.5402,
711
- "eval_samples_per_second": 88.158,
712
  "step": 22000
713
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
714
  {
715
  "epoch": 2.62,
716
  "learning_rate": 3.815896660072152e-05,
717
- "loss": 0.3082,
718
  "step": 22500
719
  },
720
  {
721
- "epoch": 2.62,
722
- "eval_average_metrics": 90.19343065693431,
723
- "eval_em": 89.92700729927007,
724
- "eval_f1": 90.45985401459853,
725
- "eval_loss": 0.2151171863079071,
726
- "eval_runtime": 15.4013,
727
- "eval_samples_per_second": 88.953,
728
- "step": 22500
 
 
 
 
 
 
 
 
 
 
729
  },
730
  {
731
  "epoch": 2.68,
732
  "learning_rate": 3.234027696962644e-05,
733
- "loss": 0.3139,
734
  "step": 23000
735
  },
736
  {
737
  "epoch": 2.68,
738
- "eval_average_metrics": 90.58272506082724,
739
- "eval_em": 90.2919708029197,
740
- "eval_f1": 90.8734793187348,
741
- "eval_loss": 0.21431832015514374,
742
- "eval_runtime": 15.4496,
743
- "eval_samples_per_second": 88.675,
744
  "step": 23000
745
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
746
  {
747
  "epoch": 2.73,
748
  "learning_rate": 2.6521587338531362e-05,
749
- "loss": 0.3111,
750
  "step": 23500
751
  },
752
  {
753
- "epoch": 2.73,
754
- "eval_average_metrics": 89.7433090024331,
755
- "eval_em": 89.41605839416059,
756
- "eval_f1": 90.0705596107056,
757
- "eval_loss": 0.21385075151920319,
758
- "eval_runtime": 15.7553,
759
- "eval_samples_per_second": 86.955,
760
- "step": 23500
 
 
 
 
 
 
 
 
 
 
761
  },
762
  {
763
  "epoch": 2.79,
764
  "learning_rate": 2.0702897707436283e-05,
765
- "loss": 0.3168,
766
  "step": 24000
767
  },
768
  {
769
  "epoch": 2.79,
770
- "eval_average_metrics": 89.81630170316302,
771
- "eval_em": 89.56204379562044,
772
- "eval_f1": 90.0705596107056,
773
- "eval_loss": 0.2146376520395279,
774
- "eval_runtime": 15.4091,
775
- "eval_samples_per_second": 88.908,
776
  "step": 24000
777
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
778
  {
779
  "epoch": 2.85,
780
  "learning_rate": 1.4884208076341207e-05,
781
- "loss": 0.3115,
782
  "step": 24500
783
  },
784
  {
785
- "epoch": 2.85,
786
- "eval_average_metrics": 89.26885644768856,
787
- "eval_em": 88.97810218978101,
788
- "eval_f1": 89.5596107055961,
789
- "eval_loss": 0.21739177405834198,
790
- "eval_runtime": 15.7449,
791
- "eval_samples_per_second": 87.012,
792
- "step": 24500
 
 
 
 
 
 
 
 
 
 
793
  },
794
  {
795
  "epoch": 2.91,
796
  "learning_rate": 9.065518445246129e-06,
797
- "loss": 0.3144,
798
  "step": 25000
799
  },
800
  {
801
  "epoch": 2.91,
802
- "eval_average_metrics": 90.08394160583941,
803
- "eval_em": 89.78102189781022,
804
- "eval_f1": 90.38686131386861,
805
- "eval_loss": 0.21506215631961823,
806
- "eval_runtime": 15.5375,
807
- "eval_samples_per_second": 88.174,
808
  "step": 25000
809
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
810
  {
811
  "epoch": 2.97,
812
  "learning_rate": 3.2468288141510528e-06,
813
- "loss": 0.3119,
814
  "step": 25500
815
  },
816
  {
817
- "epoch": 2.97,
818
- "eval_average_metrics": 90.10827250608273,
819
- "eval_em": 89.85401459854015,
820
  "eval_f1": 90.36253041362531,
821
- "eval_loss": 0.21424712240695953,
822
- "eval_runtime": 15.4741,
823
- "eval_samples_per_second": 88.535,
824
- "step": 25500
825
  },
826
  {
827
  "epoch": 3.0,
828
  "step": 25779,
829
- "total_flos": 2.1011901579256954e+17,
830
- "train_loss": 0.3297047741756515,
831
- "train_runtime": 5659.5381,
832
- "train_samples_per_second": 72.877,
833
- "train_steps_per_second": 4.555
834
  }
835
  ],
836
  "max_steps": 25779,
837
  "num_train_epochs": 3,
838
- "total_flos": 2.1011901579256954e+17,
839
  "trial_name": null,
840
  "trial_params": null
841
  }
 
1
  {
2
+ "best_metric": 91.36131386861314,
3
+ "best_model_checkpoint": "outputs/bitfit/t5-base/superglue-record/checkpoint-1200",
4
  "epoch": 3.0,
5
  "global_step": 25779,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
+ {
11
+ "epoch": 0.02,
12
+ "eval_average_metrics": 89.01338199513381,
13
+ "eval_em": 88.75912408759125,
14
+ "eval_f1": 89.2676399026764,
15
+ "eval_loss": 0.2185831516981125,
16
+ "eval_runtime": 34.599,
17
+ "eval_samples_per_second": 39.597,
18
+ "step": 200
19
+ },
20
+ {
21
+ "epoch": 0.05,
22
+ "eval_average_metrics": 89.71289537712894,
23
+ "eval_em": 89.48905109489051,
24
+ "eval_f1": 89.93673965936739,
25
+ "eval_loss": 0.22008372843265533,
26
+ "eval_runtime": 36.1565,
27
+ "eval_samples_per_second": 37.891,
28
+ "step": 400
29
+ },
30
  {
31
  "epoch": 0.06,
32
  "learning_rate": 0.0002941813103689049,
33
+ "loss": 0.3381,
34
  "step": 500
35
  },
36
  {
37
+ "epoch": 0.07,
38
+ "eval_average_metrics": 89.17518248175182,
39
+ "eval_em": 88.9051094890511,
40
+ "eval_f1": 89.44525547445255,
41
+ "eval_loss": 0.22487574815750122,
42
+ "eval_runtime": 38.7912,
43
+ "eval_samples_per_second": 35.317,
44
+ "step": 600
45
+ },
46
+ {
47
+ "epoch": 0.09,
48
+ "eval_average_metrics": 90.32725060827251,
49
+ "eval_em": 89.92700729927007,
50
+ "eval_f1": 90.72749391727494,
51
+ "eval_loss": 0.22092510759830475,
52
+ "eval_runtime": 38.8963,
53
+ "eval_samples_per_second": 35.222,
54
+ "step": 800
55
  },
56
  {
57
  "epoch": 0.12,
58
  "learning_rate": 0.0002883626207378098,
59
+ "loss": 0.3288,
60
  "step": 1000
61
  },
62
  {
63
  "epoch": 0.12,
64
+ "eval_average_metrics": 90.82603406326035,
65
+ "eval_em": 90.58394160583941,
66
+ "eval_f1": 91.06812652068128,
67
+ "eval_loss": 0.2161024510860443,
68
+ "eval_runtime": 38.0375,
69
+ "eval_samples_per_second": 36.017,
70
  "step": 1000
71
  },
72
+ {
73
+ "epoch": 0.14,
74
+ "eval_average_metrics": 91.36131386861314,
75
+ "eval_em": 91.0948905109489,
76
+ "eval_f1": 91.62773722627739,
77
+ "eval_loss": 0.21504777669906616,
78
+ "eval_runtime": 36.1024,
79
+ "eval_samples_per_second": 37.948,
80
+ "step": 1200
81
+ },
82
+ {
83
+ "epoch": 0.16,
84
+ "eval_average_metrics": 89.69829683698296,
85
+ "eval_em": 89.41605839416059,
86
+ "eval_f1": 89.98053527980535,
87
+ "eval_loss": 0.21785993874073029,
88
+ "eval_runtime": 38.4041,
89
+ "eval_samples_per_second": 35.673,
90
+ "step": 1400
91
+ },
92
  {
93
  "epoch": 0.17,
94
  "learning_rate": 0.00028254393110671474,
95
+ "loss": 0.333,
96
  "step": 1500
97
  },
98
  {
99
+ "epoch": 0.19,
100
+ "eval_average_metrics": 89.78345498783455,
101
+ "eval_em": 89.34306569343066,
102
+ "eval_f1": 90.22384428223845,
103
+ "eval_loss": 0.21883782744407654,
104
+ "eval_runtime": 35.4761,
105
+ "eval_samples_per_second": 38.618,
106
+ "step": 1600
107
+ },
108
+ {
109
+ "epoch": 0.21,
110
+ "eval_average_metrics": 89.54866180048661,
111
+ "eval_em": 89.41605839416059,
112
+ "eval_f1": 89.68126520681264,
113
+ "eval_loss": 0.22056403756141663,
114
+ "eval_runtime": 35.8766,
115
+ "eval_samples_per_second": 38.186,
116
+ "step": 1800
117
  },
118
  {
119
  "epoch": 0.23,
120
  "learning_rate": 0.0002767252414756197,
121
+ "loss": 0.3283,
122
  "step": 2000
123
  },
124
  {
125
  "epoch": 0.23,
126
+ "eval_average_metrics": 88.84306569343067,
127
+ "eval_em": 88.39416058394161,
128
+ "eval_f1": 89.29197080291972,
129
+ "eval_loss": 0.22133098542690277,
130
+ "eval_runtime": 36.0963,
131
+ "eval_samples_per_second": 37.954,
132
  "step": 2000
133
  },
134
+ {
135
+ "epoch": 0.26,
136
+ "eval_average_metrics": 89.49391727493916,
137
+ "eval_em": 89.19708029197079,
138
+ "eval_f1": 89.79075425790754,
139
+ "eval_loss": 0.22017844021320343,
140
+ "eval_runtime": 36.292,
141
+ "eval_samples_per_second": 37.749,
142
+ "step": 2200
143
+ },
144
+ {
145
+ "epoch": 0.28,
146
+ "eval_average_metrics": 90.77737226277371,
147
+ "eval_em": 90.43795620437956,
148
+ "eval_f1": 91.11678832116786,
149
+ "eval_loss": 0.21572071313858032,
150
+ "eval_runtime": 38.375,
151
+ "eval_samples_per_second": 35.7,
152
+ "step": 2400
153
+ },
154
  {
155
  "epoch": 0.29,
156
  "learning_rate": 0.0002709065518445246,
157
+ "loss": 0.3258,
158
  "step": 2500
159
  },
160
  {
161
+ "epoch": 0.3,
162
+ "eval_average_metrics": 90.58880778588806,
163
+ "eval_em": 90.2919708029197,
164
+ "eval_f1": 90.88564476885644,
165
+ "eval_loss": 0.21875151991844177,
166
+ "eval_runtime": 36.4713,
167
+ "eval_samples_per_second": 37.564,
168
+ "step": 2600
169
+ },
170
+ {
171
+ "epoch": 0.33,
172
+ "eval_average_metrics": 89.81630170316302,
173
+ "eval_em": 89.48905109489051,
174
+ "eval_f1": 90.14355231143553,
175
+ "eval_loss": 0.22119711339473724,
176
+ "eval_runtime": 36.7112,
177
+ "eval_samples_per_second": 37.318,
178
+ "step": 2800
179
  },
180
  {
181
  "epoch": 0.35,
182
  "learning_rate": 0.0002650878622134295,
183
+ "loss": 0.3308,
184
  "step": 3000
185
  },
186
  {
187
  "epoch": 0.35,
188
+ "eval_average_metrics": 89.86253041362531,
189
+ "eval_em": 89.41605839416059,
190
+ "eval_f1": 90.30900243309003,
191
+ "eval_loss": 0.21812815964221954,
192
+ "eval_runtime": 35.9089,
193
+ "eval_samples_per_second": 38.152,
194
  "step": 3000
195
  },
196
+ {
197
+ "epoch": 0.37,
198
+ "eval_average_metrics": 90.68004866180048,
199
+ "eval_em": 90.2919708029197,
200
+ "eval_f1": 91.06812652068126,
201
+ "eval_loss": 0.21945150196552277,
202
+ "eval_runtime": 36.7647,
203
+ "eval_samples_per_second": 37.264,
204
+ "step": 3200
205
+ },
206
+ {
207
+ "epoch": 0.4,
208
+ "eval_average_metrics": 88.52676399026764,
209
+ "eval_em": 88.24817518248175,
210
+ "eval_f1": 88.80535279805353,
211
+ "eval_loss": 0.22326913475990295,
212
+ "eval_runtime": 38.4494,
213
+ "eval_samples_per_second": 35.631,
214
+ "step": 3400
215
+ },
216
  {
217
  "epoch": 0.41,
218
  "learning_rate": 0.00025926917258233445,
219
+ "loss": 0.3268,
220
  "step": 3500
221
  },
222
  {
223
+ "epoch": 0.42,
224
+ "eval_average_metrics": 89.9014598540146,
225
+ "eval_em": 89.56204379562044,
226
+ "eval_f1": 90.24087591240875,
227
+ "eval_loss": 0.2204274833202362,
228
+ "eval_runtime": 39.4301,
229
+ "eval_samples_per_second": 34.745,
230
+ "step": 3600
231
+ },
232
+ {
233
+ "epoch": 0.44,
234
+ "eval_average_metrics": 88.8491484184915,
235
+ "eval_em": 88.54014598540147,
236
+ "eval_f1": 89.15815085158151,
237
+ "eval_loss": 0.22101299464702606,
238
+ "eval_runtime": 36.7124,
239
+ "eval_samples_per_second": 37.317,
240
+ "step": 3800
241
  },
242
  {
243
  "epoch": 0.47,
244
  "learning_rate": 0.0002534504829512394,
245
+ "loss": 0.3266,
246
  "step": 4000
247
  },
248
  {
249
  "epoch": 0.47,
250
+ "eval_average_metrics": 90.43673965936739,
251
+ "eval_em": 90.07299270072993,
252
+ "eval_f1": 90.80048661800487,
253
+ "eval_loss": 0.2189851850271225,
254
+ "eval_runtime": 38.8738,
255
+ "eval_samples_per_second": 35.242,
256
  "step": 4000
257
  },
258
+ {
259
+ "epoch": 0.49,
260
+ "eval_average_metrics": 88.7676399026764,
261
+ "eval_em": 88.39416058394161,
262
+ "eval_f1": 89.14111922141119,
263
+ "eval_loss": 0.22029492259025574,
264
+ "eval_runtime": 37.8194,
265
+ "eval_samples_per_second": 36.225,
266
+ "step": 4200
267
+ },
268
+ {
269
+ "epoch": 0.51,
270
+ "eval_average_metrics": 89.73722627737226,
271
+ "eval_em": 89.41605839416059,
272
+ "eval_f1": 90.05839416058394,
273
+ "eval_loss": 0.21841323375701904,
274
+ "eval_runtime": 39.6246,
275
+ "eval_samples_per_second": 34.575,
276
+ "step": 4400
277
+ },
278
  {
279
  "epoch": 0.52,
280
  "learning_rate": 0.0002476317933201443,
281
+ "loss": 0.3309,
282
  "step": 4500
283
  },
284
  {
285
+ "epoch": 0.54,
286
+ "eval_average_metrics": 89.49391727493918,
287
+ "eval_em": 89.27007299270073,
288
+ "eval_f1": 89.71776155717761,
289
+ "eval_loss": 0.2204442322254181,
290
+ "eval_runtime": 39.9817,
291
+ "eval_samples_per_second": 34.266,
292
+ "step": 4600
293
+ },
294
+ {
295
+ "epoch": 0.56,
296
+ "eval_average_metrics": 89.69464720194647,
297
+ "eval_em": 89.34306569343066,
298
+ "eval_f1": 90.04622871046227,
299
+ "eval_loss": 0.2244672179222107,
300
+ "eval_runtime": 38.4253,
301
+ "eval_samples_per_second": 35.654,
302
+ "step": 4800
303
  },
304
  {
305
  "epoch": 0.58,
306
  "learning_rate": 0.0002418131036890492,
307
+ "loss": 0.3285,
308
  "step": 5000
309
  },
310
  {
311
  "epoch": 0.58,
312
+ "eval_average_metrics": 89.48783454987836,
313
+ "eval_em": 89.27007299270073,
314
+ "eval_f1": 89.70559610705597,
315
+ "eval_loss": 0.21830883622169495,
316
+ "eval_runtime": 38.7825,
317
+ "eval_samples_per_second": 35.325,
318
  "step": 5000
319
  },
320
+ {
321
+ "epoch": 0.61,
322
+ "eval_average_metrics": 88.56326034063261,
323
+ "eval_em": 88.32116788321169,
324
+ "eval_f1": 88.80535279805352,
325
+ "eval_loss": 0.22253794968128204,
326
+ "eval_runtime": 38.0561,
327
+ "eval_samples_per_second": 36.0,
328
+ "step": 5200
329
+ },
330
+ {
331
+ "epoch": 0.63,
332
+ "eval_average_metrics": 89.82846715328466,
333
+ "eval_em": 89.56204379562044,
334
+ "eval_f1": 90.09489051094889,
335
+ "eval_loss": 0.22128665447235107,
336
+ "eval_runtime": 39.7387,
337
+ "eval_samples_per_second": 34.475,
338
+ "step": 5400
339
+ },
340
  {
341
  "epoch": 0.64,
342
  "learning_rate": 0.0002359944140579541,
343
+ "loss": 0.3296,
344
  "step": 5500
345
  },
346
  {
347
+ "epoch": 0.65,
348
+ "eval_average_metrics": 89.02919708029196,
349
+ "eval_em": 88.6861313868613,
350
+ "eval_f1": 89.37226277372264,
351
+ "eval_loss": 0.2234881967306137,
352
+ "eval_runtime": 38.4221,
353
+ "eval_samples_per_second": 35.657,
354
+ "step": 5600
355
+ },
356
+ {
357
+ "epoch": 0.67,
358
+ "eval_average_metrics": 89.64355231143553,
359
+ "eval_em": 89.34306569343066,
360
+ "eval_f1": 89.9440389294404,
361
+ "eval_loss": 0.2219015508890152,
362
+ "eval_runtime": 39.7412,
363
+ "eval_samples_per_second": 34.473,
364
+ "step": 5800
365
  },
366
  {
367
  "epoch": 0.7,
368
  "learning_rate": 0.00023017572442685905,
369
+ "loss": 0.3377,
370
  "step": 6000
371
  },
372
  {
373
  "epoch": 0.7,
374
+ "eval_average_metrics": 89.13503649635037,
375
+ "eval_em": 88.9051094890511,
376
+ "eval_f1": 89.36496350364963,
377
+ "eval_loss": 0.22565637528896332,
378
+ "eval_runtime": 38.9351,
379
+ "eval_samples_per_second": 35.187,
380
  "step": 6000
381
  },
382
+ {
383
+ "epoch": 0.72,
384
+ "eval_average_metrics": 89.66788321167883,
385
+ "eval_em": 89.34306569343066,
386
+ "eval_f1": 89.99270072992701,
387
+ "eval_loss": 0.2238757461309433,
388
+ "eval_runtime": 36.8334,
389
+ "eval_samples_per_second": 37.195,
390
+ "step": 6200
391
+ },
392
+ {
393
+ "epoch": 0.74,
394
+ "eval_average_metrics": 90.63138686131386,
395
+ "eval_em": 90.2919708029197,
396
+ "eval_f1": 90.970802919708,
397
+ "eval_loss": 0.2218635529279709,
398
+ "eval_runtime": 39.5931,
399
+ "eval_samples_per_second": 34.602,
400
+ "step": 6400
401
+ },
402
  {
403
  "epoch": 0.76,
404
  "learning_rate": 0.00022435703479576396,
405
+ "loss": 0.3271,
406
  "step": 6500
407
  },
408
  {
409
+ "epoch": 0.77,
410
+ "eval_average_metrics": 90.15450121654501,
411
+ "eval_em": 89.85401459854015,
412
+ "eval_f1": 90.45498783454988,
413
+ "eval_loss": 0.2218872755765915,
414
+ "eval_runtime": 36.9426,
415
+ "eval_samples_per_second": 37.085,
416
+ "step": 6600
417
+ },
418
+ {
419
+ "epoch": 0.79,
420
+ "eval_average_metrics": 90.49513381995133,
421
+ "eval_em": 90.14598540145985,
422
+ "eval_f1": 90.84428223844282,
423
+ "eval_loss": 0.2184651792049408,
424
+ "eval_runtime": 38.3744,
425
+ "eval_samples_per_second": 35.701,
426
+ "step": 6800
427
  },
428
  {
429
  "epoch": 0.81,
430
  "learning_rate": 0.0002185383451646689,
431
+ "loss": 0.3221,
432
  "step": 7000
433
  },
434
  {
435
  "epoch": 0.81,
436
+ "eval_average_metrics": 91.12773722627736,
437
+ "eval_em": 90.8029197080292,
438
+ "eval_f1": 91.45255474452554,
439
+ "eval_loss": 0.2153433859348297,
440
+ "eval_runtime": 38.0801,
441
+ "eval_samples_per_second": 35.977,
442
  "step": 7000
443
  },
444
+ {
445
+ "epoch": 0.84,
446
+ "eval_average_metrics": 90.32481751824818,
447
+ "eval_em": 90.0,
448
+ "eval_f1": 90.64963503649636,
449
+ "eval_loss": 0.21808864176273346,
450
+ "eval_runtime": 39.0051,
451
+ "eval_samples_per_second": 35.124,
452
+ "step": 7200
453
+ },
454
+ {
455
+ "epoch": 0.86,
456
+ "eval_average_metrics": 89.08394160583941,
457
+ "eval_em": 88.75912408759125,
458
+ "eval_f1": 89.4087591240876,
459
+ "eval_loss": 0.22276869416236877,
460
+ "eval_runtime": 36.749,
461
+ "eval_samples_per_second": 37.28,
462
+ "step": 7400
463
+ },
464
  {
465
  "epoch": 0.87,
466
  "learning_rate": 0.00021271965553357382,
467
+ "loss": 0.3226,
468
  "step": 7500
469
  },
470
  {
471
+ "epoch": 0.88,
472
+ "eval_average_metrics": 90.485401459854,
473
+ "eval_em": 90.21897810218978,
474
+ "eval_f1": 90.75182481751823,
475
+ "eval_loss": 0.21675343811511993,
476
+ "eval_runtime": 37.5554,
477
+ "eval_samples_per_second": 36.479,
478
+ "step": 7600
479
+ },
480
+ {
481
+ "epoch": 0.91,
482
+ "eval_average_metrics": 90.02311435523114,
483
+ "eval_em": 89.78102189781022,
484
+ "eval_f1": 90.26520681265205,
485
+ "eval_loss": 0.21614064276218414,
486
+ "eval_runtime": 33.4296,
487
+ "eval_samples_per_second": 40.982,
488
+ "step": 7800
489
  },
490
  {
491
  "epoch": 0.93,
492
  "learning_rate": 0.00020690096590247876,
493
+ "loss": 0.3262,
494
  "step": 8000
495
  },
496
  {
497
  "epoch": 0.93,
498
+ "eval_average_metrics": 90.10583941605839,
499
+ "eval_em": 89.78102189781022,
500
+ "eval_f1": 90.43065693430657,
501
+ "eval_loss": 0.2208666056394577,
502
+ "eval_runtime": 35.7275,
503
+ "eval_samples_per_second": 38.346,
504
  "step": 8000
505
  },
506
+ {
507
+ "epoch": 0.95,
508
+ "eval_average_metrics": 88.86253041362531,
509
+ "eval_em": 88.46715328467153,
510
+ "eval_f1": 89.25790754257908,
511
+ "eval_loss": 0.22296273708343506,
512
+ "eval_runtime": 37.4484,
513
+ "eval_samples_per_second": 36.584,
514
+ "step": 8200
515
+ },
516
+ {
517
+ "epoch": 0.98,
518
+ "eval_average_metrics": 88.69708029197079,
519
+ "eval_em": 88.39416058394161,
520
+ "eval_f1": 88.99999999999999,
521
+ "eval_loss": 0.2256641685962677,
522
+ "eval_runtime": 36.1104,
523
+ "eval_samples_per_second": 37.939,
524
+ "step": 8400
525
+ },
526
  {
527
  "epoch": 0.99,
528
  "learning_rate": 0.00020108227627138367,
529
+ "loss": 0.3246,
530
  "step": 8500
531
  },
532
  {
533
+ "epoch": 1.0,
534
+ "eval_average_metrics": 90.43673965936739,
535
+ "eval_em": 90.14598540145985,
536
+ "eval_f1": 90.72749391727494,
537
+ "eval_loss": 0.2168925255537033,
538
+ "eval_runtime": 36.8057,
539
+ "eval_samples_per_second": 37.223,
540
+ "step": 8600
541
+ },
542
+ {
543
+ "epoch": 1.02,
544
+ "eval_average_metrics": 90.17883211678833,
545
+ "eval_em": 89.85401459854015,
546
+ "eval_f1": 90.5036496350365,
547
+ "eval_loss": 0.21890240907669067,
548
+ "eval_runtime": 36.2138,
549
+ "eval_samples_per_second": 37.831,
550
+ "step": 8800
551
  },
552
  {
553
  "epoch": 1.05,
554
  "learning_rate": 0.00019526358664028858,
555
+ "loss": 0.3085,
556
  "step": 9000
557
  },
558
  {
559
  "epoch": 1.05,
560
+ "eval_average_metrics": 90.25182481751824,
561
+ "eval_em": 90.0,
562
+ "eval_f1": 90.5036496350365,
563
+ "eval_loss": 0.21791431307792664,
564
+ "eval_runtime": 36.94,
565
+ "eval_samples_per_second": 37.087,
566
  "step": 9000
567
  },
568
+ {
569
+ "epoch": 1.07,
570
+ "eval_average_metrics": 90.31508515815085,
571
+ "eval_em": 90.07299270072993,
572
+ "eval_f1": 90.55717761557177,
573
+ "eval_loss": 0.2160734087228775,
574
+ "eval_runtime": 35.6639,
575
+ "eval_samples_per_second": 38.414,
576
+ "step": 9200
577
+ },
578
+ {
579
+ "epoch": 1.09,
580
+ "eval_average_metrics": 89.48783454987836,
581
+ "eval_em": 89.27007299270073,
582
+ "eval_f1": 89.70559610705597,
583
+ "eval_loss": 0.22037485241889954,
584
+ "eval_runtime": 37.8808,
585
+ "eval_samples_per_second": 36.166,
586
+ "step": 9400
587
+ },
588
  {
589
  "epoch": 1.11,
590
  "learning_rate": 0.00018944489700919352,
591
+ "loss": 0.3185,
592
  "step": 9500
593
  },
594
  {
595
+ "epoch": 1.12,
596
+ "eval_average_metrics": 88.35401459854015,
597
+ "eval_em": 88.02919708029196,
598
+ "eval_f1": 88.67883211678833,
599
+ "eval_loss": 0.22213077545166016,
600
+ "eval_runtime": 36.2657,
601
+ "eval_samples_per_second": 37.777,
602
+ "step": 9600
603
+ },
604
+ {
605
+ "epoch": 1.14,
606
+ "eval_average_metrics": 87.77007299270073,
607
+ "eval_em": 87.44525547445255,
608
+ "eval_f1": 88.09489051094891,
609
+ "eval_loss": 0.22431711852550507,
610
+ "eval_runtime": 34.0786,
611
+ "eval_samples_per_second": 40.201,
612
+ "step": 9800
613
  },
614
  {
615
  "epoch": 1.16,
616
  "learning_rate": 0.00018362620737809844,
617
+ "loss": 0.3149,
618
  "step": 10000
619
  },
620
  {
621
  "epoch": 1.16,
622
+ "eval_average_metrics": 88.28953771289537,
623
+ "eval_em": 88.02919708029196,
624
+ "eval_f1": 88.54987834549878,
625
+ "eval_loss": 0.2239065319299698,
626
+ "eval_runtime": 37.3216,
627
+ "eval_samples_per_second": 36.708,
628
  "step": 10000
629
  },
630
+ {
631
+ "epoch": 1.19,
632
+ "eval_average_metrics": 90.12043795620437,
633
+ "eval_em": 89.85401459854015,
634
+ "eval_f1": 90.3868613138686,
635
+ "eval_loss": 0.21789653599262238,
636
+ "eval_runtime": 35.8306,
637
+ "eval_samples_per_second": 38.235,
638
+ "step": 10200
639
+ },
640
+ {
641
+ "epoch": 1.21,
642
+ "eval_average_metrics": 89.71654501216544,
643
+ "eval_em": 89.41605839416059,
644
+ "eval_f1": 90.0170316301703,
645
+ "eval_loss": 0.2222936451435089,
646
+ "eval_runtime": 35.4154,
647
+ "eval_samples_per_second": 38.684,
648
+ "step": 10400
649
+ },
650
  {
651
  "epoch": 1.22,
652
  "learning_rate": 0.00017780751774700338,
653
+ "loss": 0.3167,
654
  "step": 10500
655
  },
656
  {
657
+ "epoch": 1.23,
658
+ "eval_average_metrics": 89.19586374695864,
659
+ "eval_em": 88.83211678832117,
660
+ "eval_f1": 89.5596107055961,
661
+ "eval_loss": 0.22271069884300232,
662
+ "eval_runtime": 35.7044,
663
+ "eval_samples_per_second": 38.371,
664
+ "step": 10600
665
+ },
666
+ {
667
+ "epoch": 1.26,
668
+ "eval_average_metrics": 89.97445255474452,
669
+ "eval_em": 89.7080291970803,
670
+ "eval_f1": 90.24087591240875,
671
+ "eval_loss": 0.22066636383533478,
672
+ "eval_runtime": 34.2308,
673
+ "eval_samples_per_second": 40.022,
674
+ "step": 10800
675
  },
676
  {
677
  "epoch": 1.28,
678
  "learning_rate": 0.0001719888281159083,
679
+ "loss": 0.3179,
680
  "step": 11000
681
  },
682
  {
683
  "epoch": 1.28,
684
+ "eval_average_metrics": 90.05717761557177,
685
+ "eval_em": 89.78102189781022,
686
+ "eval_f1": 90.33333333333333,
687
+ "eval_loss": 0.2182897925376892,
688
+ "eval_runtime": 36.8191,
689
+ "eval_samples_per_second": 37.209,
690
  "step": 11000
691
  },
692
+ {
693
+ "epoch": 1.3,
694
+ "eval_average_metrics": 88.34428223844282,
695
+ "eval_em": 88.02919708029196,
696
+ "eval_f1": 88.65936739659367,
697
+ "eval_loss": 0.22293207049369812,
698
+ "eval_runtime": 38.8183,
699
+ "eval_samples_per_second": 35.293,
700
+ "step": 11200
701
+ },
702
+ {
703
+ "epoch": 1.33,
704
+ "eval_average_metrics": 90.60705596107056,
705
+ "eval_em": 90.36496350364963,
706
+ "eval_f1": 90.84914841849148,
707
+ "eval_loss": 0.2161208987236023,
708
+ "eval_runtime": 38.6684,
709
+ "eval_samples_per_second": 35.429,
710
+ "step": 11400
711
+ },
712
  {
713
  "epoch": 1.34,
714
  "learning_rate": 0.00016617013848481323,
715
+ "loss": 0.3153,
716
  "step": 11500
717
  },
718
  {
719
+ "epoch": 1.35,
720
+ "eval_average_metrics": 90.38807785888078,
721
+ "eval_em": 90.14598540145985,
722
+ "eval_f1": 90.6301703163017,
723
+ "eval_loss": 0.2135632187128067,
724
+ "eval_runtime": 38.983,
725
+ "eval_samples_per_second": 35.144,
726
+ "step": 11600
727
+ },
728
+ {
729
+ "epoch": 1.37,
730
+ "eval_average_metrics": 89.14720194647202,
731
+ "eval_em": 88.9051094890511,
732
+ "eval_f1": 89.38929440389293,
733
+ "eval_loss": 0.22012485563755035,
734
+ "eval_runtime": 39.657,
735
+ "eval_samples_per_second": 34.546,
736
+ "step": 11800
737
  },
738
  {
739
  "epoch": 1.4,
740
  "learning_rate": 0.00016035144885371815,
741
+ "loss": 0.3216,
742
  "step": 12000
743
  },
744
  {
745
  "epoch": 1.4,
746
+ "eval_average_metrics": 89.6581508515815,
747
+ "eval_em": 89.41605839416059,
748
+ "eval_f1": 89.90024330900242,
749
+ "eval_loss": 0.21762309968471527,
750
+ "eval_runtime": 40.4674,
751
+ "eval_samples_per_second": 33.854,
752
  "step": 12000
753
  },
754
+ {
755
+ "epoch": 1.42,
756
+ "eval_average_metrics": 89.30535279805352,
757
+ "eval_em": 89.05109489051095,
758
+ "eval_f1": 89.5596107055961,
759
+ "eval_loss": 0.21773971617221832,
760
+ "eval_runtime": 38.4174,
761
+ "eval_samples_per_second": 35.661,
762
+ "step": 12200
763
+ },
764
+ {
765
+ "epoch": 1.44,
766
+ "eval_average_metrics": 90.169099756691,
767
+ "eval_em": 89.92700729927007,
768
+ "eval_f1": 90.41119221411194,
769
+ "eval_loss": 0.21440057456493378,
770
+ "eval_runtime": 37.9225,
771
+ "eval_samples_per_second": 36.126,
772
+ "step": 12400
773
+ },
774
  {
775
  "epoch": 1.45,
776
  "learning_rate": 0.00015453275922262303,
777
+ "loss": 0.3151,
778
  "step": 12500
779
  },
780
  {
781
+ "epoch": 1.47,
782
+ "eval_average_metrics": 89.58515815085158,
783
+ "eval_em": 89.34306569343066,
784
+ "eval_f1": 89.82725060827251,
785
+ "eval_loss": 0.21768692135810852,
786
+ "eval_runtime": 36.5526,
787
+ "eval_samples_per_second": 37.48,
788
+ "step": 12600
789
+ },
790
+ {
791
+ "epoch": 1.49,
792
+ "eval_average_metrics": 89.99878345498783,
793
+ "eval_em": 89.78102189781022,
794
+ "eval_f1": 90.21654501216545,
795
+ "eval_loss": 0.2161240428686142,
796
+ "eval_runtime": 39.5978,
797
+ "eval_samples_per_second": 34.598,
798
+ "step": 12800
799
  },
800
  {
801
  "epoch": 1.51,
802
  "learning_rate": 0.00014871406959152797,
803
+ "loss": 0.3255,
804
  "step": 13000
805
  },
806
  {
807
  "epoch": 1.51,
808
+ "eval_average_metrics": 89.70681265206812,
809
+ "eval_em": 89.48905109489051,
810
+ "eval_f1": 89.92457420924575,
811
+ "eval_loss": 0.21710088849067688,
812
+ "eval_runtime": 38.5743,
813
+ "eval_samples_per_second": 35.516,
814
  "step": 13000
815
  },
816
+ {
817
+ "epoch": 1.54,
818
+ "eval_average_metrics": 89.3515815085158,
819
+ "eval_em": 89.05109489051095,
820
+ "eval_f1": 89.65206812652067,
821
+ "eval_loss": 0.21740640699863434,
822
+ "eval_runtime": 38.7743,
823
+ "eval_samples_per_second": 35.333,
824
+ "step": 13200
825
+ },
826
+ {
827
+ "epoch": 1.56,
828
+ "eval_average_metrics": 90.29075425790754,
829
+ "eval_em": 90.07299270072993,
830
+ "eval_f1": 90.50851581508516,
831
+ "eval_loss": 0.21489615738391876,
832
+ "eval_runtime": 41.332,
833
+ "eval_samples_per_second": 33.146,
834
+ "step": 13400
835
+ },
836
  {
837
  "epoch": 1.57,
838
  "learning_rate": 0.00014289537996043292,
839
+ "loss": 0.3129,
840
  "step": 13500
841
  },
842
  {
843
+ "epoch": 1.58,
844
+ "eval_average_metrics": 89.81386861313868,
845
+ "eval_em": 89.48905109489051,
846
+ "eval_f1": 90.13868613138686,
847
+ "eval_loss": 0.21436673402786255,
848
+ "eval_runtime": 39.3785,
849
+ "eval_samples_per_second": 34.791,
850
+ "step": 13600
851
+ },
852
+ {
853
+ "epoch": 1.61,
854
+ "eval_average_metrics": 89.77980535279806,
855
+ "eval_em": 89.48905109489051,
856
+ "eval_f1": 90.0705596107056,
857
+ "eval_loss": 0.21632547676563263,
858
+ "eval_runtime": 36.2514,
859
+ "eval_samples_per_second": 37.792,
860
+ "step": 13800
861
  },
862
  {
863
  "epoch": 1.63,
864
  "learning_rate": 0.00013707669032933783,
865
+ "loss": 0.317,
866
  "step": 14000
867
  },
868
  {
869
  "epoch": 1.63,
870
+ "eval_average_metrics": 90.14476885644768,
871
+ "eval_em": 89.85401459854015,
872
+ "eval_f1": 90.43552311435523,
873
+ "eval_loss": 0.21579378843307495,
874
+ "eval_runtime": 38.9315,
875
+ "eval_samples_per_second": 35.19,
876
  "step": 14000
877
  },
878
+ {
879
+ "epoch": 1.65,
880
+ "eval_average_metrics": 89.69221411192214,
881
+ "eval_em": 89.34306569343066,
882
+ "eval_f1": 90.04136253041362,
883
+ "eval_loss": 0.21815675497055054,
884
+ "eval_runtime": 38.141,
885
+ "eval_samples_per_second": 35.919,
886
+ "step": 14200
887
+ },
888
+ {
889
+ "epoch": 1.68,
890
+ "eval_average_metrics": 90.26642335766422,
891
+ "eval_em": 90.0,
892
+ "eval_f1": 90.53284671532845,
893
+ "eval_loss": 0.21684660017490387,
894
+ "eval_runtime": 36.4617,
895
+ "eval_samples_per_second": 37.574,
896
+ "step": 14400
897
+ },
898
  {
899
  "epoch": 1.69,
900
  "learning_rate": 0.00013125800069824274,
901
+ "loss": 0.3204,
902
  "step": 14500
903
  },
904
  {
905
+ "epoch": 1.7,
906
+ "eval_average_metrics": 90.54379562043796,
907
+ "eval_em": 90.21897810218978,
908
+ "eval_f1": 90.86861313868614,
909
+ "eval_loss": 0.21547624468803406,
910
+ "eval_runtime": 39.6007,
911
+ "eval_samples_per_second": 34.595,
912
+ "step": 14600
913
+ },
914
+ {
915
+ "epoch": 1.72,
916
+ "eval_average_metrics": 90.76277372262774,
917
+ "eval_em": 90.43795620437956,
918
+ "eval_f1": 91.08759124087592,
919
+ "eval_loss": 0.2154303342103958,
920
+ "eval_runtime": 37.9795,
921
+ "eval_samples_per_second": 36.072,
922
+ "step": 14800
923
  },
924
  {
925
  "epoch": 1.75,
926
  "learning_rate": 0.00012543931106714766,
927
+ "loss": 0.3153,
928
  "step": 15000
929
  },
930
  {
931
  "epoch": 1.75,
932
+ "eval_average_metrics": 90.34914841849148,
933
+ "eval_em": 90.0,
934
+ "eval_f1": 90.69829683698296,
935
+ "eval_loss": 0.21602213382720947,
936
+ "eval_runtime": 40.2922,
937
+ "eval_samples_per_second": 34.002,
938
  "step": 15000
939
  },
940
+ {
941
+ "epoch": 1.77,
942
+ "eval_average_metrics": 89.31751824817519,
943
+ "eval_em": 89.05109489051095,
944
+ "eval_f1": 89.58394160583941,
945
+ "eval_loss": 0.2179516851902008,
946
+ "eval_runtime": 36.6124,
947
+ "eval_samples_per_second": 37.419,
948
+ "step": 15200
949
+ },
950
+ {
951
+ "epoch": 1.79,
952
+ "eval_average_metrics": 89.24452554744525,
953
+ "eval_em": 88.97810218978101,
954
+ "eval_f1": 89.51094890510949,
955
+ "eval_loss": 0.2189921736717224,
956
+ "eval_runtime": 37.6709,
957
+ "eval_samples_per_second": 36.368,
958
+ "step": 15400
959
+ },
960
  {
961
  "epoch": 1.8,
962
  "learning_rate": 0.00011962062143605258,
963
+ "loss": 0.3104,
964
  "step": 15500
965
  },
966
  {
967
+ "epoch": 1.82,
968
+ "eval_average_metrics": 89.02554744525548,
969
+ "eval_em": 88.75912408759125,
970
+ "eval_f1": 89.29197080291972,
971
+ "eval_loss": 0.21728622913360596,
972
+ "eval_runtime": 37.6931,
973
+ "eval_samples_per_second": 36.346,
974
+ "step": 15600
975
+ },
976
+ {
977
+ "epoch": 1.84,
978
+ "eval_average_metrics": 90.48540145985402,
979
+ "eval_em": 90.21897810218978,
980
+ "eval_f1": 90.75182481751824,
981
+ "eval_loss": 0.21391963958740234,
982
+ "eval_runtime": 37.4604,
983
+ "eval_samples_per_second": 36.572,
984
+ "step": 15800
985
  },
986
  {
987
  "epoch": 1.86,
988
  "learning_rate": 0.00011380193180495751,
989
+ "loss": 0.3221,
990
  "step": 16000
991
  },
992
  {
993
  "epoch": 1.86,
994
+ "eval_average_metrics": 90.92335766423358,
995
+ "eval_em": 90.65693430656935,
996
+ "eval_f1": 91.18978102189779,
997
+ "eval_loss": 0.21324890851974487,
998
+ "eval_runtime": 36.0923,
999
+ "eval_samples_per_second": 37.958,
1000
  "step": 16000
1001
  },
1002
+ {
1003
+ "epoch": 1.89,
1004
+ "eval_average_metrics": 90.36374695863748,
1005
+ "eval_em": 90.07299270072993,
1006
+ "eval_f1": 90.65450121654501,
1007
+ "eval_loss": 0.21571427583694458,
1008
+ "eval_runtime": 36.3418,
1009
+ "eval_samples_per_second": 37.698,
1010
+ "step": 16200
1011
+ },
1012
+ {
1013
+ "epoch": 1.91,
1014
+ "eval_average_metrics": 90.58272506082724,
1015
+ "eval_em": 90.2919708029197,
1016
+ "eval_f1": 90.8734793187348,
1017
+ "eval_loss": 0.21374623477458954,
1018
+ "eval_runtime": 35.332,
1019
+ "eval_samples_per_second": 38.775,
1020
+ "step": 16400
1021
+ },
1022
  {
1023
  "epoch": 1.92,
1024
  "learning_rate": 0.00010798324217386244,
1025
+ "loss": 0.3142,
1026
  "step": 16500
1027
  },
1028
  {
1029
+ "epoch": 1.93,
1030
+ "eval_average_metrics": 90.41240875912409,
1031
+ "eval_em": 90.14598540145985,
1032
+ "eval_f1": 90.67883211678833,
1033
+ "eval_loss": 0.21370555460453033,
1034
+ "eval_runtime": 37.2326,
1035
+ "eval_samples_per_second": 36.796,
1036
+ "step": 16600
1037
+ },
1038
+ {
1039
+ "epoch": 1.96,
1040
+ "eval_average_metrics": 89.75547445255475,
1041
+ "eval_em": 89.48905109489051,
1042
+ "eval_f1": 90.02189781021897,
1043
+ "eval_loss": 0.21746164560317993,
1044
+ "eval_runtime": 35.4995,
1045
+ "eval_samples_per_second": 38.592,
1046
+ "step": 16800
1047
  },
1048
  {
1049
  "epoch": 1.98,
1050
  "learning_rate": 0.00010216455254276737,
1051
+ "loss": 0.3206,
1052
  "step": 17000
1053
  },
1054
  {
1055
  "epoch": 1.98,
1056
+ "eval_average_metrics": 89.82846715328466,
1057
+ "eval_em": 89.56204379562044,
1058
+ "eval_f1": 90.0948905109489,
1059
+ "eval_loss": 0.2167847603559494,
1060
+ "eval_runtime": 37.0794,
1061
+ "eval_samples_per_second": 36.948,
1062
  "step": 17000
1063
  },
1064
+ {
1065
+ "epoch": 2.0,
1066
+ "eval_average_metrics": 90.26642335766422,
1067
+ "eval_em": 90.0,
1068
+ "eval_f1": 90.53284671532846,
1069
+ "eval_loss": 0.21559016406536102,
1070
+ "eval_runtime": 37.9031,
1071
+ "eval_samples_per_second": 36.145,
1072
+ "step": 17200
1073
+ },
1074
+ {
1075
+ "epoch": 2.02,
1076
+ "eval_average_metrics": 89.97445255474452,
1077
+ "eval_em": 89.7080291970803,
1078
+ "eval_f1": 90.24087591240874,
1079
+ "eval_loss": 0.21499326825141907,
1080
+ "eval_runtime": 33.4521,
1081
+ "eval_samples_per_second": 40.954,
1082
+ "step": 17400
1083
+ },
1084
  {
1085
  "epoch": 2.04,
1086
  "learning_rate": 9.634586291167229e-05,
1087
+ "loss": 0.3109,
1088
  "step": 17500
1089
  },
1090
  {
1091
+ "epoch": 2.05,
1092
+ "eval_average_metrics": 90.14476885644768,
1093
+ "eval_em": 89.85401459854015,
1094
+ "eval_f1": 90.43552311435523,
1095
+ "eval_loss": 0.21627335250377655,
1096
+ "eval_runtime": 35.646,
1097
+ "eval_samples_per_second": 38.434,
1098
+ "step": 17600
1099
+ },
1100
+ {
1101
+ "epoch": 2.07,
1102
+ "eval_average_metrics": 90.48540145985402,
1103
+ "eval_em": 90.14598540145985,
1104
+ "eval_f1": 90.8248175182482,
1105
+ "eval_loss": 0.21596278250217438,
1106
+ "eval_runtime": 36.6834,
1107
+ "eval_samples_per_second": 37.347,
1108
+ "step": 17800
1109
  },
1110
  {
1111
  "epoch": 2.09,
1112
  "learning_rate": 9.052717328057722e-05,
1113
+ "loss": 0.3035,
1114
  "step": 18000
1115
  },
1116
  {
1117
  "epoch": 2.09,
1118
+ "eval_average_metrics": 89.97445255474453,
1119
+ "eval_em": 89.7080291970803,
1120
+ "eval_f1": 90.24087591240877,
1121
+ "eval_loss": 0.21806372702121735,
1122
+ "eval_runtime": 34.0399,
1123
+ "eval_samples_per_second": 40.247,
1124
  "step": 18000
1125
  },
1126
+ {
1127
+ "epoch": 2.12,
1128
+ "eval_average_metrics": 89.58515815085158,
1129
+ "eval_em": 89.34306569343066,
1130
+ "eval_f1": 89.82725060827251,
1131
+ "eval_loss": 0.2175503671169281,
1132
+ "eval_runtime": 35.3257,
1133
+ "eval_samples_per_second": 38.782,
1134
+ "step": 18200
1135
+ },
1136
+ {
1137
+ "epoch": 2.14,
1138
+ "eval_average_metrics": 90.29075425790754,
1139
+ "eval_em": 90.0,
1140
+ "eval_f1": 90.58150851581509,
1141
+ "eval_loss": 0.21528899669647217,
1142
+ "eval_runtime": 37.4995,
1143
+ "eval_samples_per_second": 36.534,
1144
+ "step": 18400
1145
+ },
1146
  {
1147
  "epoch": 2.15,
1148
  "learning_rate": 8.470848364948212e-05,
1149
+ "loss": 0.3102,
1150
  "step": 18500
1151
  },
1152
  {
1153
+ "epoch": 2.16,
1154
+ "eval_average_metrics": 89.9501216545012,
1155
+ "eval_em": 89.7080291970803,
1156
+ "eval_f1": 90.19221411192213,
1157
+ "eval_loss": 0.21668794751167297,
1158
+ "eval_runtime": 36.8393,
1159
+ "eval_samples_per_second": 37.189,
1160
+ "step": 18600
1161
+ },
1162
+ {
1163
+ "epoch": 2.19,
1164
+ "eval_average_metrics": 90.04744525547446,
1165
+ "eval_em": 89.78102189781022,
1166
+ "eval_f1": 90.31386861313868,
1167
+ "eval_loss": 0.2147464007139206,
1168
+ "eval_runtime": 36.4341,
1169
+ "eval_samples_per_second": 37.602,
1170
+ "step": 18800
1171
  },
1172
  {
1173
  "epoch": 2.21,
1174
  "learning_rate": 7.888979401838705e-05,
1175
+ "loss": 0.2992,
1176
  "step": 19000
1177
  },
1178
  {
1179
  "epoch": 2.21,
1180
+ "eval_average_metrics": 89.56082725060827,
1181
+ "eval_em": 89.34306569343066,
1182
+ "eval_f1": 89.77858880778588,
1183
+ "eval_loss": 0.21566100418567657,
1184
+ "eval_runtime": 37.3837,
1185
+ "eval_samples_per_second": 36.647,
1186
  "step": 19000
1187
  },
1188
+ {
1189
+ "epoch": 2.23,
1190
+ "eval_average_metrics": 89.26885644768856,
1191
+ "eval_em": 89.05109489051095,
1192
+ "eval_f1": 89.48661800486619,
1193
+ "eval_loss": 0.21698147058486938,
1194
+ "eval_runtime": 34.5662,
1195
+ "eval_samples_per_second": 39.634,
1196
+ "step": 19200
1197
+ },
1198
+ {
1199
+ "epoch": 2.26,
1200
+ "eval_average_metrics": 89.9501216545012,
1201
+ "eval_em": 89.7080291970803,
1202
+ "eval_f1": 90.19221411192213,
1203
+ "eval_loss": 0.21671971678733826,
1204
+ "eval_runtime": 39.0865,
1205
+ "eval_samples_per_second": 35.05,
1206
+ "step": 19400
1207
+ },
1208
  {
1209
  "epoch": 2.27,
1210
  "learning_rate": 7.307110438729197e-05,
1211
+ "loss": 0.3104,
1212
  "step": 19500
1213
  },
1214
  {
1215
+ "epoch": 2.28,
1216
+ "eval_average_metrics": 88.92822384428223,
1217
+ "eval_em": 88.6861313868613,
1218
+ "eval_f1": 89.17031630170315,
1219
+ "eval_loss": 0.21831820905208588,
1220
+ "eval_runtime": 38.0065,
1221
+ "eval_samples_per_second": 36.046,
1222
+ "step": 19600
1223
+ },
1224
+ {
1225
+ "epoch": 2.3,
1226
+ "eval_average_metrics": 89.82846715328466,
1227
+ "eval_em": 89.56204379562044,
1228
+ "eval_f1": 90.09489051094889,
1229
+ "eval_loss": 0.2175111472606659,
1230
+ "eval_runtime": 38.7133,
1231
+ "eval_samples_per_second": 35.388,
1232
+ "step": 19800
1233
  },
1234
  {
1235
  "epoch": 2.33,
1236
  "learning_rate": 6.72524147561969e-05,
1237
+ "loss": 0.299,
1238
  "step": 20000
1239
  },
1240
  {
1241
  "epoch": 2.33,
1242
+ "eval_average_metrics": 90.04744525547446,
1243
+ "eval_em": 89.78102189781022,
1244
+ "eval_f1": 90.31386861313868,
1245
+ "eval_loss": 0.21775414049625397,
1246
+ "eval_runtime": 37.1614,
1247
+ "eval_samples_per_second": 36.866,
1248
  "step": 20000
1249
  },
1250
+ {
1251
+ "epoch": 2.35,
1252
+ "eval_average_metrics": 90.33941605839416,
1253
+ "eval_em": 90.07299270072993,
1254
+ "eval_f1": 90.60583941605839,
1255
+ "eval_loss": 0.21791471540927887,
1256
+ "eval_runtime": 38.7185,
1257
+ "eval_samples_per_second": 35.384,
1258
+ "step": 20200
1259
+ },
1260
+ {
1261
+ "epoch": 2.37,
1262
+ "eval_average_metrics": 90.85036496350364,
1263
+ "eval_em": 90.58394160583941,
1264
+ "eval_f1": 91.11678832116786,
1265
+ "eval_loss": 0.21669700741767883,
1266
+ "eval_runtime": 36.9688,
1267
+ "eval_samples_per_second": 37.058,
1268
+ "step": 20400
1269
+ },
1270
  {
1271
  "epoch": 2.39,
1272
  "learning_rate": 6.143372512510183e-05,
1273
+ "loss": 0.3106,
1274
  "step": 20500
1275
  },
1276
  {
1277
+ "epoch": 2.4,
1278
+ "eval_average_metrics": 90.99635036496349,
1279
+ "eval_em": 90.72992700729927,
1280
+ "eval_f1": 91.26277372262773,
1281
+ "eval_loss": 0.21628382802009583,
1282
+ "eval_runtime": 36.1926,
1283
+ "eval_samples_per_second": 37.853,
1284
+ "step": 20600
1285
+ },
1286
+ {
1287
+ "epoch": 2.42,
1288
+ "eval_average_metrics": 90.485401459854,
1289
+ "eval_em": 90.21897810218978,
1290
+ "eval_f1": 90.75182481751823,
1291
+ "eval_loss": 0.2179671972990036,
1292
+ "eval_runtime": 35.7701,
1293
+ "eval_samples_per_second": 38.3,
1294
+ "step": 20800
1295
  },
1296
  {
1297
  "epoch": 2.44,
1298
  "learning_rate": 5.561503549400675e-05,
1299
+ "loss": 0.3131,
1300
  "step": 21000
1301
  },
1302
  {
1303
  "epoch": 2.44,
1304
+ "eval_average_metrics": 89.90145985401459,
1305
+ "eval_em": 89.63503649635037,
1306
+ "eval_f1": 90.16788321167881,
1307
+ "eval_loss": 0.21815823018550873,
1308
+ "eval_runtime": 38.6202,
1309
+ "eval_samples_per_second": 35.474,
1310
  "step": 21000
1311
  },
1312
+ {
1313
+ "epoch": 2.47,
1314
+ "eval_average_metrics": 89.81386861313868,
1315
+ "eval_em": 89.48905109489051,
1316
+ "eval_f1": 90.13868613138686,
1317
+ "eval_loss": 0.21742023527622223,
1318
+ "eval_runtime": 38.6698,
1319
+ "eval_samples_per_second": 35.428,
1320
+ "step": 21200
1321
+ },
1322
+ {
1323
+ "epoch": 2.49,
1324
+ "eval_average_metrics": 90.54379562043796,
1325
+ "eval_em": 90.21897810218978,
1326
+ "eval_f1": 90.86861313868614,
1327
+ "eval_loss": 0.21656812727451324,
1328
+ "eval_runtime": 37.7889,
1329
+ "eval_samples_per_second": 36.254,
1330
+ "step": 21400
1331
+ },
1332
  {
1333
  "epoch": 2.5,
1334
  "learning_rate": 4.9796345862911663e-05,
1335
+ "loss": 0.3109,
1336
  "step": 21500
1337
  },
1338
  {
1339
+ "epoch": 2.51,
1340
+ "eval_average_metrics": 90.47080291970804,
1341
+ "eval_em": 90.14598540145985,
1342
+ "eval_f1": 90.79562043795622,
1343
+ "eval_loss": 0.21554183959960938,
1344
+ "eval_runtime": 40.3847,
1345
+ "eval_samples_per_second": 33.924,
1346
+ "step": 21600
1347
+ },
1348
+ {
1349
+ "epoch": 2.54,
1350
+ "eval_average_metrics": 90.55839416058393,
1351
+ "eval_em": 90.2919708029197,
1352
+ "eval_f1": 90.82481751824815,
1353
+ "eval_loss": 0.21551626920700073,
1354
+ "eval_runtime": 40.9505,
1355
+ "eval_samples_per_second": 33.455,
1356
+ "step": 21800
1357
  },
1358
  {
1359
  "epoch": 2.56,
1360
  "learning_rate": 4.397765623181659e-05,
1361
+ "loss": 0.3139,
1362
  "step": 22000
1363
  },
1364
  {
1365
  "epoch": 2.56,
1366
+ "eval_average_metrics": 90.53406326034063,
1367
+ "eval_em": 90.21897810218978,
1368
+ "eval_f1": 90.84914841849148,
1369
+ "eval_loss": 0.21652992069721222,
1370
+ "eval_runtime": 39.2455,
1371
+ "eval_samples_per_second": 34.908,
1372
  "step": 22000
1373
  },
1374
+ {
1375
+ "epoch": 2.58,
1376
+ "eval_average_metrics": 90.38807785888076,
1377
+ "eval_em": 90.07299270072993,
1378
+ "eval_f1": 90.70316301703161,
1379
+ "eval_loss": 0.2176700383424759,
1380
+ "eval_runtime": 39.6231,
1381
+ "eval_samples_per_second": 34.576,
1382
+ "step": 22200
1383
+ },
1384
+ {
1385
+ "epoch": 2.61,
1386
+ "eval_average_metrics": 90.82603406326034,
1387
+ "eval_em": 90.51094890510949,
1388
+ "eval_f1": 91.14111922141119,
1389
+ "eval_loss": 0.21595974266529083,
1390
+ "eval_runtime": 38.5872,
1391
+ "eval_samples_per_second": 35.504,
1392
+ "step": 22400
1393
+ },
1394
  {
1395
  "epoch": 2.62,
1396
  "learning_rate": 3.815896660072152e-05,
1397
+ "loss": 0.3012,
1398
  "step": 22500
1399
  },
1400
  {
1401
+ "epoch": 2.63,
1402
+ "eval_average_metrics": 90.60705596107056,
1403
+ "eval_em": 90.2919708029197,
1404
+ "eval_f1": 90.9221411192214,
1405
+ "eval_loss": 0.2160317748785019,
1406
+ "eval_runtime": 38.122,
1407
+ "eval_samples_per_second": 35.937,
1408
+ "step": 22600
1409
+ },
1410
+ {
1411
+ "epoch": 2.65,
1412
+ "eval_average_metrics": 90.65571776155718,
1413
+ "eval_em": 90.36496350364963,
1414
+ "eval_f1": 90.94647201946472,
1415
+ "eval_loss": 0.21644768118858337,
1416
+ "eval_runtime": 34.8398,
1417
+ "eval_samples_per_second": 39.323,
1418
+ "step": 22800
1419
  },
1420
  {
1421
  "epoch": 2.68,
1422
  "learning_rate": 3.234027696962644e-05,
1423
+ "loss": 0.3084,
1424
  "step": 23000
1425
  },
1426
  {
1427
  "epoch": 2.68,
1428
+ "eval_average_metrics": 90.169099756691,
1429
+ "eval_em": 89.85401459854015,
1430
+ "eval_f1": 90.48418491484183,
1431
+ "eval_loss": 0.21626520156860352,
1432
+ "eval_runtime": 34.9713,
1433
+ "eval_samples_per_second": 39.175,
1434
  "step": 23000
1435
  },
1436
+ {
1437
+ "epoch": 2.7,
1438
+ "eval_average_metrics": 89.58515815085158,
1439
+ "eval_em": 89.27007299270073,
1440
+ "eval_f1": 89.90024330900242,
1441
+ "eval_loss": 0.2173507809638977,
1442
+ "eval_runtime": 34.5287,
1443
+ "eval_samples_per_second": 39.677,
1444
+ "step": 23200
1445
+ },
1446
+ {
1447
+ "epoch": 2.72,
1448
+ "eval_average_metrics": 89.58515815085158,
1449
+ "eval_em": 89.27007299270073,
1450
+ "eval_f1": 89.90024330900242,
1451
+ "eval_loss": 0.21798554062843323,
1452
+ "eval_runtime": 32.6335,
1453
+ "eval_samples_per_second": 41.981,
1454
+ "step": 23400
1455
+ },
1456
  {
1457
  "epoch": 2.73,
1458
  "learning_rate": 2.6521587338531362e-05,
1459
+ "loss": 0.3034,
1460
  "step": 23500
1461
  },
1462
  {
1463
+ "epoch": 2.75,
1464
+ "eval_average_metrics": 89.6581508515815,
1465
+ "eval_em": 89.34306569343066,
1466
+ "eval_f1": 89.97323600973235,
1467
+ "eval_loss": 0.2169240415096283,
1468
+ "eval_runtime": 31.2981,
1469
+ "eval_samples_per_second": 43.773,
1470
+ "step": 23600
1471
+ },
1472
+ {
1473
+ "epoch": 2.77,
1474
+ "eval_average_metrics": 90.02311435523114,
1475
+ "eval_em": 89.7080291970803,
1476
+ "eval_f1": 90.338199513382,
1477
+ "eval_loss": 0.2169690728187561,
1478
+ "eval_runtime": 31.3076,
1479
+ "eval_samples_per_second": 43.759,
1480
+ "step": 23800
1481
  },
1482
  {
1483
  "epoch": 2.79,
1484
  "learning_rate": 2.0702897707436283e-05,
1485
+ "loss": 0.3087,
1486
  "step": 24000
1487
  },
1488
  {
1489
  "epoch": 2.79,
1490
+ "eval_average_metrics": 90.53406326034063,
1491
+ "eval_em": 90.21897810218978,
1492
+ "eval_f1": 90.84914841849148,
1493
+ "eval_loss": 0.2168567031621933,
1494
+ "eval_runtime": 32.1016,
1495
+ "eval_samples_per_second": 42.677,
1496
  "step": 24000
1497
  },
1498
+ {
1499
+ "epoch": 2.82,
1500
+ "eval_average_metrics": 90.169099756691,
1501
+ "eval_em": 89.85401459854015,
1502
+ "eval_f1": 90.48418491484183,
1503
+ "eval_loss": 0.21707168221473694,
1504
+ "eval_runtime": 34.5668,
1505
+ "eval_samples_per_second": 39.633,
1506
+ "step": 24200
1507
+ },
1508
+ {
1509
+ "epoch": 2.84,
1510
+ "eval_average_metrics": 90.169099756691,
1511
+ "eval_em": 89.85401459854015,
1512
+ "eval_f1": 90.48418491484183,
1513
+ "eval_loss": 0.2168397605419159,
1514
+ "eval_runtime": 35.1948,
1515
+ "eval_samples_per_second": 38.926,
1516
+ "step": 24400
1517
+ },
1518
  {
1519
  "epoch": 2.85,
1520
  "learning_rate": 1.4884208076341207e-05,
1521
+ "loss": 0.3038,
1522
  "step": 24500
1523
  },
1524
  {
1525
+ "epoch": 2.86,
1526
+ "eval_average_metrics": 89.14720194647202,
1527
+ "eval_em": 88.83211678832117,
1528
+ "eval_f1": 89.46228710462286,
1529
+ "eval_loss": 0.21729852259159088,
1530
+ "eval_runtime": 35.4024,
1531
+ "eval_samples_per_second": 38.698,
1532
+ "step": 24600
1533
+ },
1534
+ {
1535
+ "epoch": 2.89,
1536
+ "eval_average_metrics": 89.99878345498783,
1537
+ "eval_em": 89.7080291970803,
1538
+ "eval_f1": 90.28953771289538,
1539
+ "eval_loss": 0.21667222678661346,
1540
+ "eval_runtime": 34.8507,
1541
+ "eval_samples_per_second": 39.311,
1542
+ "step": 24800
1543
  },
1544
  {
1545
  "epoch": 2.91,
1546
  "learning_rate": 9.065518445246129e-06,
1547
+ "loss": 0.3083,
1548
  "step": 25000
1549
  },
1550
  {
1551
  "epoch": 2.91,
1552
+ "eval_average_metrics": 90.21776155717762,
1553
+ "eval_em": 89.92700729927007,
1554
+ "eval_f1": 90.50851581508516,
1555
+ "eval_loss": 0.216518834233284,
1556
+ "eval_runtime": 34.7968,
1557
+ "eval_samples_per_second": 39.371,
1558
  "step": 25000
1559
  },
1560
+ {
1561
+ "epoch": 2.93,
1562
+ "eval_average_metrics": 90.07177615571777,
1563
+ "eval_em": 89.78102189781022,
1564
+ "eval_f1": 90.36253041362531,
1565
+ "eval_loss": 0.21596592664718628,
1566
+ "eval_runtime": 34.8982,
1567
+ "eval_samples_per_second": 39.257,
1568
+ "step": 25200
1569
+ },
1570
+ {
1571
+ "epoch": 2.96,
1572
+ "eval_average_metrics": 90.07177615571777,
1573
+ "eval_em": 89.78102189781022,
1574
+ "eval_f1": 90.36253041362531,
1575
+ "eval_loss": 0.21597927808761597,
1576
+ "eval_runtime": 35.1856,
1577
+ "eval_samples_per_second": 38.936,
1578
+ "step": 25400
1579
+ },
1580
  {
1581
  "epoch": 2.97,
1582
  "learning_rate": 3.2468288141510528e-06,
1583
+ "loss": 0.3048,
1584
  "step": 25500
1585
  },
1586
  {
1587
+ "epoch": 2.98,
1588
+ "eval_average_metrics": 90.07177615571777,
1589
+ "eval_em": 89.78102189781022,
1590
  "eval_f1": 90.36253041362531,
1591
+ "eval_loss": 0.21600975096225739,
1592
+ "eval_runtime": 33.008,
1593
+ "eval_samples_per_second": 41.505,
1594
+ "step": 25600
1595
  },
1596
  {
1597
  "epoch": 3.0,
1598
  "step": 25779,
1599
+ "total_flos": 2.1177253912543027e+17,
1600
+ "train_loss": 0.3175360437943145,
1601
+ "train_runtime": 17672.1841,
1602
+ "train_samples_per_second": 23.339,
1603
+ "train_steps_per_second": 1.459
1604
  }
1605
  ],
1606
  "max_steps": 25779,
1607
  "num_train_epochs": 3,
1608
+ "total_flos": 2.1177253912543027e+17,
1609
  "trial_name": null,
1610
  "trial_params": null
1611
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a9fc0b2c802946c2d87bb004854bb82ca322e9997328e616e2973d3f37a9dacc
3
  size 3183
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b54ef46ceeb8bfabb09b43e3ec6d062336e479231fa78b4d934c2be81827529
3
  size 3183
training_config.json CHANGED
@@ -1 +1 @@
1
- {"bottleneck_dim": 24, "dataset_config_name": ["en"], "delta_type": "adapter", "do_eval": true, "do_test": true, "do_train": true, "eval_dataset_config_name": ["en"], "eval_dataset_name": "superglue-record", "eval_steps": 200, "evaluation_strategy": "steps", "greater_is_better": true, "learning_rate": 0.0003, "load_best_model_at_end": true, "max_source_length": 512, "metric_for_best_model": "average_metrics", "model_name_or_path": "../../../../plm_cache/t5-base", "num_train_epochs": 3, "output_dir": "outputs/bitfit/t5-base/superglue-record", "overwrite_output_dir": true, "per_device_eval_batch_size": 16, "per_device_train_batch_size": 16, "predict_with_generate": true, "push_to_hub": true, "save_steps": 200, "save_strategy": "steps", "save_total_limit": 1, "seed": 42, "split_validation_test": true, "task_name": "superglue-record", "test_dataset_config_name": ["en"], "test_dataset_name": "superglue-record", "tokenizer_name": "../../../../plm_cache/t5-base", "unfrozen_modules": ["deltas", "layer_norm", "final_layer_norm"], "warmup_steps": 0}
 
1
+ {"dataset_config_name": ["en"], "delta_type": "lora", "do_eval": true, "do_test": true, "do_train": true, "eval_dataset_config_name": ["en"], "eval_dataset_name": "superglue-record", "eval_steps": 200, "evaluation_strategy": "steps", "greater_is_better": true, "learning_rate": 0.0003, "load_best_model_at_end": true, "lora_r": 8, "max_source_length": 512, "metric_for_best_model": "average_metrics", "model_name_or_path": "../../../../plm_cache/t5-base", "num_train_epochs": 3, "output_dir": "outputs/bitfit/t5-base/superglue-record", "overwrite_output_dir": true, "per_device_eval_batch_size": 16, "per_device_train_batch_size": 16, "predict_with_generate": true, "push_to_hub": true, "save_steps": 200, "save_strategy": "steps", "save_total_limit": 1, "seed": 42, "split_validation_test": true, "task_name": "superglue-record", "test_dataset_config_name": ["en"], "test_dataset_name": "superglue-record", "tokenizer_name": "../../../../plm_cache/t5-base", "unfrozen_modules": ["deltas", "layer_norm", "final_layer_norm"], "warmup_steps": 0}