thomaslim6793 commited on
Commit
551fe86
·
verified ·
1 Parent(s): d5d9722

Update multitask INDRA statement classifier

Browse files
all_results.json CHANGED
@@ -1,28 +1,28 @@
1
  {
2
  "epoch": 10.0,
3
- "eval_gate1_accuracy": 0.9213647144681627,
4
- "eval_gate1_f1": 0.9186345562318086,
5
- "eval_gate1_precision": 0.9201991431515453,
6
- "eval_gate1_recall": 0.917244999785811,
7
- "eval_gate1_support": 5481,
8
- "eval_gate2_accuracy": 0.8666301769750046,
9
- "eval_gate2_f1": 0.8084870586267471,
10
- "eval_gate2_precision": 0.8025086025493519,
11
- "eval_gate2_recall": 0.8192604428212116,
12
- "eval_gate2_support": 5481,
13
- "eval_gate3_accuracy": 0.896040316774658,
14
- "eval_gate3_f1": 0.7248294888969216,
15
- "eval_gate3_precision": 0.7283732815204376,
16
- "eval_gate3_recall": 0.7292579147184429,
17
  "eval_gate3_support": 6945,
18
- "eval_gate4_span_FN": 191,
19
- "eval_gate4_span_FP": 216,
20
- "eval_gate4_span_TP": 820,
21
- "eval_gate4_span_f1": 0.8011724424770412,
22
- "eval_gate4_span_precision": 0.7915057914981516,
23
- "eval_gate4_span_recall": 0.8110781404469725,
24
  "eval_loss": NaN,
25
- "eval_runtime": 11.7731,
26
- "eval_samples_per_second": 1141.924,
27
- "eval_steps_per_second": 35.759
28
  }
 
1
  {
2
  "epoch": 10.0,
3
+ "eval_gate1_accuracy": 0.9251295336787565,
4
+ "eval_gate1_f1": 0.9199371922438249,
5
+ "eval_gate1_precision": 0.920966070966071,
6
+ "eval_gate1_recall": 0.9189513092953367,
7
+ "eval_gate1_support": 3860,
8
+ "eval_gate2_accuracy": 0.8709844559585492,
9
+ "eval_gate2_f1": 0.8487797208181732,
10
+ "eval_gate2_precision": 0.8500529357712848,
11
+ "eval_gate2_recall": 0.8532136788618205,
12
+ "eval_gate2_support": 3860,
13
+ "eval_gate3_accuracy": 0.8920086393088553,
14
+ "eval_gate3_f1": 0.6992827001481418,
15
+ "eval_gate3_precision": 0.715591871957983,
16
+ "eval_gate3_recall": 0.7063340262769819,
17
  "eval_gate3_support": 6945,
18
+ "eval_gate4_span_FN": 196,
19
+ "eval_gate4_span_FP": 204,
20
+ "eval_gate4_span_TP": 815,
21
+ "eval_gate4_span_f1": 0.8029556600167974,
22
+ "eval_gate4_span_precision": 0.7998037291383728,
23
+ "eval_gate4_span_recall": 0.8061325420296129,
24
  "eval_loss": NaN,
25
+ "eval_runtime": 10.4274,
26
+ "eval_samples_per_second": 1133.841,
27
+ "eval_steps_per_second": 35.483
28
  }
eval_results.json CHANGED
@@ -1,28 +1,28 @@
1
  {
2
  "epoch": 10.0,
3
- "eval_gate1_accuracy": 0.9246350364963504,
4
- "eval_gate1_f1": 0.9205333497188853,
5
- "eval_gate1_precision": 0.9217073986882154,
6
- "eval_gate1_recall": 0.9194276042067187,
7
- "eval_gate1_support": 5480,
8
- "eval_gate2_accuracy": 0.8678832116788321,
9
- "eval_gate2_f1": 0.8058316251370092,
10
- "eval_gate2_precision": 0.8166158136605832,
11
- "eval_gate2_recall": 0.7978233842024146,
12
- "eval_gate2_support": 5480,
13
- "eval_gate3_accuracy": 0.8917206623470122,
14
- "eval_gate3_f1": 0.8222395535726833,
15
- "eval_gate3_precision": 0.8221736195559818,
16
- "eval_gate3_recall": 0.8242704639947701,
17
  "eval_gate3_support": 6945,
18
- "eval_gate4_span_FN": 203,
19
- "eval_gate4_span_FP": 229,
20
- "eval_gate4_span_TP": 804,
21
- "eval_gate4_span_f1": 0.7882352891107315,
22
- "eval_gate4_span_precision": 0.7783155856652633,
23
- "eval_gate4_span_recall": 0.7984111221370565,
24
  "eval_loss": NaN,
25
- "eval_runtime": 11.7348,
26
- "eval_samples_per_second": 1145.568,
27
- "eval_steps_per_second": 35.876
28
  }
 
1
  {
2
  "epoch": 10.0,
3
+ "eval_gate1_accuracy": 0.9217413837781808,
4
+ "eval_gate1_f1": 0.9163582001286115,
5
+ "eval_gate1_precision": 0.9168310136033854,
6
+ "eval_gate1_recall": 0.915894857280501,
7
+ "eval_gate1_support": 3859,
8
+ "eval_gate2_accuracy": 0.8717284270536408,
9
+ "eval_gate2_f1": 0.8542694094275488,
10
+ "eval_gate2_precision": 0.8495135391288109,
11
+ "eval_gate2_recall": 0.8711254994444528,
12
+ "eval_gate2_support": 3859,
13
+ "eval_gate3_accuracy": 0.8866810655147588,
14
+ "eval_gate3_f1": 0.8118642371342876,
15
+ "eval_gate3_precision": 0.8115033608543574,
16
+ "eval_gate3_recall": 0.8169535217733972,
17
  "eval_gate3_support": 6945,
18
+ "eval_gate4_span_FN": 216,
19
+ "eval_gate4_span_FP": 233,
20
+ "eval_gate4_span_TP": 791,
21
+ "eval_gate4_span_f1": 0.7789266321172492,
22
+ "eval_gate4_span_precision": 0.7724609374924565,
23
+ "eval_gate4_span_recall": 0.7855014895651886,
24
  "eval_loss": NaN,
25
+ "eval_runtime": 10.4531,
26
+ "eval_samples_per_second": 1130.954,
27
+ "eval_steps_per_second": 35.396
28
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b94cf322393ef80a1b785e7df572a818dbac55f2398d890d3892bc064ab2d1d3
3
  size 433117924
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b35d7f66fff3ea1f61adafef612dc54cbec880bc1382a940ef331aa3566de4e
3
  size 433117924
test_results.json CHANGED
@@ -1,28 +1,28 @@
1
  {
2
  "epoch": 10.0,
3
- "eval_gate1_accuracy": 0.9213647144681627,
4
- "eval_gate1_f1": 0.9186345562318086,
5
- "eval_gate1_precision": 0.9201991431515453,
6
- "eval_gate1_recall": 0.917244999785811,
7
- "eval_gate1_support": 5481,
8
- "eval_gate2_accuracy": 0.8666301769750046,
9
- "eval_gate2_f1": 0.8084870586267471,
10
- "eval_gate2_precision": 0.8025086025493519,
11
- "eval_gate2_recall": 0.8192604428212116,
12
- "eval_gate2_support": 5481,
13
- "eval_gate3_accuracy": 0.896040316774658,
14
- "eval_gate3_f1": 0.7248294888969216,
15
- "eval_gate3_precision": 0.7283732815204376,
16
- "eval_gate3_recall": 0.7292579147184429,
17
  "eval_gate3_support": 6945,
18
- "eval_gate4_span_FN": 191,
19
- "eval_gate4_span_FP": 216,
20
- "eval_gate4_span_TP": 820,
21
- "eval_gate4_span_f1": 0.8011724424770412,
22
- "eval_gate4_span_precision": 0.7915057914981516,
23
- "eval_gate4_span_recall": 0.8110781404469725,
24
  "eval_loss": NaN,
25
- "eval_runtime": 11.7731,
26
- "eval_samples_per_second": 1141.924,
27
- "eval_steps_per_second": 35.759
28
  }
 
1
  {
2
  "epoch": 10.0,
3
+ "eval_gate1_accuracy": 0.9251295336787565,
4
+ "eval_gate1_f1": 0.9199371922438249,
5
+ "eval_gate1_precision": 0.920966070966071,
6
+ "eval_gate1_recall": 0.9189513092953367,
7
+ "eval_gate1_support": 3860,
8
+ "eval_gate2_accuracy": 0.8709844559585492,
9
+ "eval_gate2_f1": 0.8487797208181732,
10
+ "eval_gate2_precision": 0.8500529357712848,
11
+ "eval_gate2_recall": 0.8532136788618205,
12
+ "eval_gate2_support": 3860,
13
+ "eval_gate3_accuracy": 0.8920086393088553,
14
+ "eval_gate3_f1": 0.6992827001481418,
15
+ "eval_gate3_precision": 0.715591871957983,
16
+ "eval_gate3_recall": 0.7063340262769819,
17
  "eval_gate3_support": 6945,
18
+ "eval_gate4_span_FN": 196,
19
+ "eval_gate4_span_FP": 204,
20
+ "eval_gate4_span_TP": 815,
21
+ "eval_gate4_span_f1": 0.8029556600167974,
22
+ "eval_gate4_span_precision": 0.7998037291383728,
23
+ "eval_gate4_span_recall": 0.8061325420296129,
24
  "eval_loss": NaN,
25
+ "eval_runtime": 10.4274,
26
+ "eval_samples_per_second": 1133.841,
27
+ "eval_steps_per_second": 35.483
28
  }
trainer_state.json CHANGED
@@ -1,444 +1,444 @@
1
  {
2
- "best_global_step": 33610,
3
- "best_metric": 0.9205333497188853,
4
- "best_model_checkpoint": "output/indra_stmt_classifier/checkpoint-33610",
5
  "epoch": 10.0,
6
  "eval_steps": 500,
7
- "global_step": 33610,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
11
  "log_history": [
12
  {
13
  "epoch": 1.0,
14
- "grad_norm": 83.16195678710938,
15
- "learning_rate": 2.7000892591490628e-05,
16
- "loss": 2.1713,
17
- "step": 3361
18
  },
19
  {
20
  "epoch": 1.0,
21
- "eval_gate1_accuracy": 0.8631386861313869,
22
- "eval_gate1_f1": 0.8496391119181088,
23
- "eval_gate1_precision": 0.8747726787205531,
24
- "eval_gate1_recall": 0.8378801625011154,
25
- "eval_gate1_support": 5480,
26
- "eval_gate2_accuracy": 0.7735401459854014,
27
- "eval_gate2_f1": 0.5551258278523046,
28
- "eval_gate2_precision": 0.5319036721194055,
29
- "eval_gate2_recall": 0.5990167093747056,
30
- "eval_gate2_support": 5480,
31
- "eval_gate3_accuracy": 0.8374370050395968,
32
- "eval_gate3_f1": 0.7282978571600487,
33
- "eval_gate3_precision": 0.6996136908126558,
34
- "eval_gate3_recall": 0.7783567551416212,
35
  "eval_gate3_support": 6945,
36
- "eval_gate4_span_FN": 253,
37
- "eval_gate4_span_FP": 367,
38
- "eval_gate4_span_TP": 754,
39
- "eval_gate4_span_f1": 0.7086466115490427,
40
- "eval_gate4_span_precision": 0.6726137377281659,
41
- "eval_gate4_span_recall": 0.7487586891683341,
42
  "eval_loss": NaN,
43
- "eval_runtime": 11.786,
44
- "eval_samples_per_second": 1140.592,
45
- "eval_steps_per_second": 35.72,
46
- "step": 3361
47
  },
48
  {
49
  "epoch": 2.0,
50
- "grad_norm": 69.370361328125,
51
- "learning_rate": 2.400089259149063e-05,
52
- "loss": 1.1877,
53
- "step": 6722
54
  },
55
  {
56
  "epoch": 2.0,
57
- "eval_gate1_accuracy": 0.9047445255474452,
58
- "eval_gate1_f1": 0.8993560611817873,
59
- "eval_gate1_precision": 0.901382455631206,
60
- "eval_gate1_recall": 0.8975327738550425,
61
- "eval_gate1_support": 5480,
62
- "eval_gate2_accuracy": 0.8321167883211679,
63
- "eval_gate2_f1": 0.6987395582230196,
64
- "eval_gate2_precision": 0.7745717741282553,
65
- "eval_gate2_recall": 0.6797882368167423,
66
- "eval_gate2_support": 5480,
67
- "eval_gate3_accuracy": 0.874154067674586,
68
- "eval_gate3_f1": 0.7533275258899098,
69
- "eval_gate3_precision": 0.7684785876654326,
70
- "eval_gate3_recall": 0.7543369804146175,
71
  "eval_gate3_support": 6945,
72
- "eval_gate4_span_FN": 249,
73
- "eval_gate4_span_FP": 225,
74
- "eval_gate4_span_TP": 758,
75
- "eval_gate4_span_f1": 0.7618090402192016,
76
- "eval_gate4_span_precision": 0.7711088504499378,
77
- "eval_gate4_span_recall": 0.7527308838058319,
78
  "eval_loss": NaN,
79
- "eval_runtime": 11.7456,
80
- "eval_samples_per_second": 1144.515,
81
- "eval_steps_per_second": 35.843,
82
- "step": 6722
83
  },
84
  {
85
  "epoch": 3.0,
86
- "grad_norm": 45.90858840942383,
87
- "learning_rate": 2.1000892591490628e-05,
88
- "loss": 0.826,
89
- "step": 10083
90
  },
91
  {
92
  "epoch": 3.0,
93
- "eval_gate1_accuracy": 0.9078467153284672,
94
- "eval_gate1_f1": 0.9015973942404003,
95
- "eval_gate1_precision": 0.9092105636457223,
96
- "eval_gate1_recall": 0.8959912039961053,
97
- "eval_gate1_support": 5480,
98
- "eval_gate2_accuracy": 0.8341240875912409,
99
- "eval_gate2_f1": 0.7503015413052768,
100
- "eval_gate2_precision": 0.7476103243098973,
101
- "eval_gate2_recall": 0.7641146716016405,
102
- "eval_gate2_support": 5480,
103
- "eval_gate3_accuracy": 0.8768898488120951,
104
- "eval_gate3_f1": 0.7962252395628027,
105
- "eval_gate3_precision": 0.7770154690688454,
106
- "eval_gate3_recall": 0.8213925119331326,
107
  "eval_gate3_support": 6945,
108
- "eval_gate4_span_FN": 246,
109
- "eval_gate4_span_FP": 169,
110
- "eval_gate4_span_TP": 761,
111
- "eval_gate4_span_f1": 0.7857511565898759,
112
- "eval_gate4_span_precision": 0.8182795698836745,
113
- "eval_gate4_span_recall": 0.7557100297839552,
114
  "eval_loss": NaN,
115
- "eval_runtime": 11.7657,
116
- "eval_samples_per_second": 1142.558,
117
- "eval_steps_per_second": 35.782,
118
- "step": 10083
119
  },
120
  {
121
  "epoch": 4.0,
122
- "grad_norm": 71.82106018066406,
123
- "learning_rate": 1.800089259149063e-05,
124
- "loss": 0.6078,
125
- "step": 13444
126
  },
127
  {
128
  "epoch": 4.0,
129
- "eval_gate1_accuracy": 0.9158759124087591,
130
- "eval_gate1_f1": 0.9110773857438494,
131
- "eval_gate1_precision": 0.9133749733155683,
132
- "eval_gate1_recall": 0.9090260872756438,
133
- "eval_gate1_support": 5480,
134
- "eval_gate2_accuracy": 0.8534671532846715,
135
- "eval_gate2_f1": 0.779756506272741,
136
- "eval_gate2_precision": 0.7797552394455943,
137
- "eval_gate2_recall": 0.7841918455268236,
138
- "eval_gate2_support": 5480,
139
- "eval_gate3_accuracy": 0.8781857451403887,
140
- "eval_gate3_f1": 0.7971838058377029,
141
- "eval_gate3_precision": 0.7985875511812209,
142
- "eval_gate3_recall": 0.7998701853370004,
143
  "eval_gate3_support": 6945,
144
- "eval_gate4_span_FN": 235,
145
- "eval_gate4_span_FP": 174,
146
- "eval_gate4_span_TP": 772,
147
- "eval_gate4_span_f1": 0.7905785920269918,
148
- "eval_gate4_span_precision": 0.8160676532683291,
149
- "eval_gate4_span_recall": 0.7666335650370741,
150
  "eval_loss": NaN,
151
- "eval_runtime": 11.7533,
152
- "eval_samples_per_second": 1143.759,
153
- "eval_steps_per_second": 35.82,
154
- "step": 13444
155
  },
156
  {
157
  "epoch": 5.0,
158
- "grad_norm": 24.64365577697754,
159
- "learning_rate": 1.5000892591490627e-05,
160
- "loss": 0.4578,
161
- "step": 16805
162
  },
163
  {
164
  "epoch": 5.0,
165
- "eval_gate1_accuracy": 0.9211678832116789,
166
- "eval_gate1_f1": 0.9164362394274561,
167
- "eval_gate1_precision": 0.920180620585261,
168
- "eval_gate1_recall": 0.9132733009849491,
169
- "eval_gate1_support": 5480,
170
- "eval_gate2_accuracy": 0.8596715328467154,
171
- "eval_gate2_f1": 0.7821118981569934,
172
- "eval_gate2_precision": 0.7823810326487586,
173
- "eval_gate2_recall": 0.7874741213438188,
174
- "eval_gate2_support": 5480,
175
- "eval_gate3_accuracy": 0.8879769618430525,
176
- "eval_gate3_f1": 0.8188009781259479,
177
- "eval_gate3_precision": 0.81704667818362,
178
- "eval_gate3_recall": 0.8239144912824204,
179
  "eval_gate3_support": 6945,
180
- "eval_gate4_span_FN": 192,
181
- "eval_gate4_span_FP": 238,
182
- "eval_gate4_span_TP": 815,
183
- "eval_gate4_span_f1": 0.7912621309171413,
184
- "eval_gate4_span_precision": 0.7739791073050905,
185
- "eval_gate4_span_recall": 0.8093346573901754,
186
  "eval_loss": NaN,
187
- "eval_runtime": 11.7427,
188
- "eval_samples_per_second": 1144.794,
189
- "eval_steps_per_second": 35.852,
190
- "step": 16805
191
  },
192
  {
193
  "epoch": 6.0,
194
- "grad_norm": 69.29522705078125,
195
- "learning_rate": 1.2000892591490627e-05,
196
- "loss": 0.3524,
197
- "step": 20166
198
  },
199
  {
200
  "epoch": 6.0,
201
- "eval_gate1_accuracy": 0.9231751824817518,
202
- "eval_gate1_f1": 0.9190504806785601,
203
- "eval_gate1_precision": 0.9199059164357939,
204
- "eval_gate1_recall": 0.9182325041170862,
205
- "eval_gate1_support": 5480,
206
- "eval_gate2_accuracy": 0.8636861313868613,
207
- "eval_gate2_f1": 0.7930432865271577,
208
- "eval_gate2_precision": 0.8121456104731711,
209
- "eval_gate2_recall": 0.7841299101269683,
210
- "eval_gate2_support": 5480,
211
- "eval_gate3_accuracy": 0.8920086393088553,
212
- "eval_gate3_f1": 0.8088394881064588,
213
- "eval_gate3_precision": 0.8180765356300564,
214
- "eval_gate3_recall": 0.8033490259257916,
215
  "eval_gate3_support": 6945,
216
- "eval_gate4_span_FN": 225,
217
- "eval_gate4_span_FP": 200,
218
- "eval_gate4_span_TP": 782,
219
- "eval_gate4_span_f1": 0.7863247813176696,
220
- "eval_gate4_span_precision": 0.79633401221185,
221
- "eval_gate4_span_recall": 0.7765640516308187,
222
  "eval_loss": NaN,
223
- "eval_runtime": 11.7509,
224
- "eval_samples_per_second": 1143.999,
225
- "eval_steps_per_second": 35.827,
226
- "step": 20166
227
  },
228
  {
229
  "epoch": 7.0,
230
- "grad_norm": 0.35947471857070923,
231
- "learning_rate": 9.000892591490627e-06,
232
- "loss": 0.2689,
233
- "step": 23527
234
  },
235
  {
236
  "epoch": 7.0,
237
- "eval_gate1_accuracy": 0.9231751824817518,
238
- "eval_gate1_f1": 0.9187638476516155,
239
- "eval_gate1_precision": 0.9212794140564127,
240
- "eval_gate1_recall": 0.9165320218048336,
241
- "eval_gate1_support": 5480,
242
- "eval_gate2_accuracy": 0.8671532846715329,
243
- "eval_gate2_f1": 0.8079309552254988,
244
- "eval_gate2_precision": 0.8227266066129817,
245
- "eval_gate2_recall": 0.797751133090433,
246
- "eval_gate2_support": 5480,
247
- "eval_gate3_accuracy": 0.8852411807055436,
248
- "eval_gate3_f1": 0.8088813524226606,
249
- "eval_gate3_precision": 0.8162963874584487,
250
- "eval_gate3_recall": 0.8038531980971689,
251
  "eval_gate3_support": 6945,
252
- "eval_gate4_span_FN": 231,
253
- "eval_gate4_span_FP": 181,
254
- "eval_gate4_span_TP": 776,
255
- "eval_gate4_span_f1": 0.7902240275817516,
256
- "eval_gate4_span_precision": 0.8108672936174413,
257
- "eval_gate4_span_recall": 0.7706057596745719,
258
  "eval_loss": NaN,
259
- "eval_runtime": 11.7438,
260
- "eval_samples_per_second": 1144.692,
261
- "eval_steps_per_second": 35.849,
262
- "step": 23527
263
  },
264
  {
265
  "epoch": 8.0,
266
- "grad_norm": 4.188035488128662,
267
- "learning_rate": 6.000892591490628e-06,
268
- "loss": 0.2153,
269
- "step": 26888
270
  },
271
  {
272
  "epoch": 8.0,
273
- "eval_gate1_accuracy": 0.9224452554744526,
274
- "eval_gate1_f1": 0.9186003567254611,
275
- "eval_gate1_precision": 0.9178172910122369,
276
- "eval_gate1_recall": 0.919420460500135,
277
- "eval_gate1_support": 5480,
278
- "eval_gate2_accuracy": 0.8651459854014598,
279
- "eval_gate2_f1": 0.8062227658402653,
280
- "eval_gate2_precision": 0.8149058818473103,
281
- "eval_gate2_recall": 0.7994866424525817,
282
- "eval_gate2_support": 5480,
283
- "eval_gate3_accuracy": 0.8921526277897768,
284
- "eval_gate3_f1": 0.8158220516262978,
285
- "eval_gate3_precision": 0.8162103501289484,
286
- "eval_gate3_recall": 0.8193325492657668,
287
  "eval_gate3_support": 6945,
288
- "eval_gate4_span_FN": 201,
289
- "eval_gate4_span_FP": 265,
290
- "eval_gate4_span_TP": 806,
291
- "eval_gate4_span_f1": 0.7757459045256693,
292
- "eval_gate4_span_precision": 0.7525676937371376,
293
- "eval_gate4_span_recall": 0.8003972194558053,
294
  "eval_loss": NaN,
295
- "eval_runtime": 11.7492,
296
- "eval_samples_per_second": 1144.16,
297
- "eval_steps_per_second": 35.832,
298
- "step": 26888
299
  },
300
  {
301
  "epoch": 9.0,
302
- "grad_norm": 1.35725998878479,
303
- "learning_rate": 3.0008925914906276e-06,
304
- "loss": 0.1666,
305
- "step": 30249
306
  },
307
  {
308
  "epoch": 9.0,
309
- "eval_gate1_accuracy": 0.9222627737226278,
310
- "eval_gate1_f1": 0.9181949570517217,
311
- "eval_gate1_precision": 0.9184837380555799,
312
- "eval_gate1_recall": 0.9179106871391289,
313
- "eval_gate1_support": 5480,
314
- "eval_gate2_accuracy": 0.8658759124087592,
315
- "eval_gate2_f1": 0.8041530479374372,
316
- "eval_gate2_precision": 0.8198064758030179,
317
- "eval_gate2_recall": 0.7941505361829777,
318
- "eval_gate2_support": 5480,
319
- "eval_gate3_accuracy": 0.8907127429805616,
320
- "eval_gate3_f1": 0.8217501511359249,
321
- "eval_gate3_precision": 0.8178736666290892,
322
- "eval_gate3_recall": 0.8276942456083646,
323
  "eval_gate3_support": 6945,
324
- "eval_gate4_span_FN": 201,
325
- "eval_gate4_span_FP": 245,
326
- "eval_gate4_span_TP": 806,
327
- "eval_gate4_span_f1": 0.7832847374630894,
328
- "eval_gate4_span_precision": 0.7668886774427509,
329
- "eval_gate4_span_recall": 0.8003972194558053,
330
  "eval_loss": NaN,
331
- "eval_runtime": 11.7734,
332
- "eval_samples_per_second": 1141.814,
333
- "eval_steps_per_second": 35.759,
334
- "step": 30249
335
  },
336
  {
337
  "epoch": 10.0,
338
- "grad_norm": 0.6299116015434265,
339
- "learning_rate": 8.925914906277894e-10,
340
- "loss": 0.1296,
341
- "step": 33610
342
  },
343
  {
344
  "epoch": 10.0,
345
- "eval_gate1_accuracy": 0.9246350364963504,
346
- "eval_gate1_f1": 0.9205333497188853,
347
- "eval_gate1_precision": 0.9217073986882154,
348
- "eval_gate1_recall": 0.9194276042067187,
349
- "eval_gate1_support": 5480,
350
- "eval_gate2_accuracy": 0.8678832116788321,
351
- "eval_gate2_f1": 0.8058316251370092,
352
- "eval_gate2_precision": 0.8166158136605832,
353
- "eval_gate2_recall": 0.7978233842024146,
354
- "eval_gate2_support": 5480,
355
- "eval_gate3_accuracy": 0.8917206623470122,
356
- "eval_gate3_f1": 0.8222395535726833,
357
- "eval_gate3_precision": 0.8221736195559818,
358
- "eval_gate3_recall": 0.8242704639947701,
359
  "eval_gate3_support": 6945,
360
- "eval_gate4_span_FN": 203,
361
- "eval_gate4_span_FP": 229,
362
- "eval_gate4_span_TP": 804,
363
- "eval_gate4_span_f1": 0.7882352891107315,
364
- "eval_gate4_span_precision": 0.7783155856652633,
365
- "eval_gate4_span_recall": 0.7984111221370565,
366
  "eval_loss": NaN,
367
- "eval_runtime": 11.7399,
368
- "eval_samples_per_second": 1145.067,
369
- "eval_steps_per_second": 35.861,
370
- "step": 33610
371
  },
372
  {
373
  "epoch": 10.0,
374
- "step": 33610,
375
- "total_flos": 6.757178668346477e+16,
376
- "train_loss": 0.6383435935713073,
377
- "train_runtime": 2441.5872,
378
- "train_samples_per_second": 440.451,
379
- "train_steps_per_second": 13.766
380
  },
381
  {
382
  "epoch": 10.0,
383
- "eval_gate1_accuracy": 0.9246350364963504,
384
- "eval_gate1_f1": 0.9205333497188853,
385
- "eval_gate1_precision": 0.9217073986882154,
386
- "eval_gate1_recall": 0.9194276042067187,
387
- "eval_gate1_support": 5480,
388
- "eval_gate2_accuracy": 0.8678832116788321,
389
- "eval_gate2_f1": 0.8058316251370092,
390
- "eval_gate2_precision": 0.8166158136605832,
391
- "eval_gate2_recall": 0.7978233842024146,
392
- "eval_gate2_support": 5480,
393
- "eval_gate3_accuracy": 0.8917206623470122,
394
- "eval_gate3_f1": 0.8222395535726833,
395
- "eval_gate3_precision": 0.8221736195559818,
396
- "eval_gate3_recall": 0.8242704639947701,
397
  "eval_gate3_support": 6945,
398
- "eval_gate4_span_FN": 203,
399
- "eval_gate4_span_FP": 229,
400
- "eval_gate4_span_TP": 804,
401
- "eval_gate4_span_f1": 0.7882352891107315,
402
- "eval_gate4_span_precision": 0.7783155856652633,
403
- "eval_gate4_span_recall": 0.7984111221370565,
404
  "eval_loss": NaN,
405
- "eval_runtime": 11.7348,
406
- "eval_samples_per_second": 1145.568,
407
- "eval_steps_per_second": 35.876,
408
- "step": 33610
409
  },
410
  {
411
  "epoch": 10.0,
412
- "eval_gate1_accuracy": 0.9213647144681627,
413
- "eval_gate1_f1": 0.9186345562318086,
414
- "eval_gate1_precision": 0.9201991431515453,
415
- "eval_gate1_recall": 0.917244999785811,
416
- "eval_gate1_support": 5481,
417
- "eval_gate2_accuracy": 0.8666301769750046,
418
- "eval_gate2_f1": 0.8084870586267471,
419
- "eval_gate2_precision": 0.8025086025493519,
420
- "eval_gate2_recall": 0.8192604428212116,
421
- "eval_gate2_support": 5481,
422
- "eval_gate3_accuracy": 0.896040316774658,
423
- "eval_gate3_f1": 0.7248294888969216,
424
- "eval_gate3_precision": 0.7283732815204376,
425
- "eval_gate3_recall": 0.7292579147184429,
426
  "eval_gate3_support": 6945,
427
- "eval_gate4_span_FN": 191,
428
- "eval_gate4_span_FP": 216,
429
- "eval_gate4_span_TP": 820,
430
- "eval_gate4_span_f1": 0.8011724424770412,
431
- "eval_gate4_span_precision": 0.7915057914981516,
432
- "eval_gate4_span_recall": 0.8110781404469725,
433
  "eval_loss": NaN,
434
- "eval_runtime": 11.7731,
435
- "eval_samples_per_second": 1141.924,
436
- "eval_steps_per_second": 35.759,
437
- "step": 33610
438
  }
439
  ],
440
  "logging_steps": 500,
441
- "max_steps": 33610,
442
  "num_input_tokens_seen": 0,
443
  "num_train_epochs": 10,
444
  "save_steps": 500,
@@ -454,7 +454,7 @@
454
  "attributes": {}
455
  }
456
  },
457
- "total_flos": 6.757178668346477e+16,
458
  "train_batch_size": 32,
459
  "trial_name": null,
460
  "trial_params": null
 
1
  {
2
+ "best_global_step": 26604,
3
+ "best_metric": 0.9163582001286115,
4
+ "best_model_checkpoint": "output/indra_stmt_classifier/checkpoint-26604",
5
  "epoch": 10.0,
6
  "eval_steps": 500,
7
+ "global_step": 29560,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
11
  "log_history": [
12
  {
13
  "epoch": 1.0,
14
+ "grad_norm": 84.59678649902344,
15
+ "learning_rate": 2.7001014884979704e-05,
16
+ "loss": 2.2672,
17
+ "step": 2956
18
  },
19
  {
20
  "epoch": 1.0,
21
+ "eval_gate1_accuracy": 0.8585125680228038,
22
+ "eval_gate1_f1": 0.8505829142307659,
23
+ "eval_gate1_precision": 0.8473952560532426,
24
+ "eval_gate1_recall": 0.854657238060827,
25
+ "eval_gate1_support": 3859,
26
+ "eval_gate2_accuracy": 0.7587457890645245,
27
+ "eval_gate2_f1": 0.5592993246296689,
28
+ "eval_gate2_precision": 0.6163758861756914,
29
+ "eval_gate2_recall": 0.5543459088227541,
30
+ "eval_gate2_support": 3859,
31
+ "eval_gate3_accuracy": 0.8548596112311015,
32
+ "eval_gate3_f1": 0.6971239789155547,
33
+ "eval_gate3_precision": 0.700932514781479,
34
+ "eval_gate3_recall": 0.7071816387030568,
35
  "eval_gate3_support": 6945,
36
+ "eval_gate4_span_FN": 230,
37
+ "eval_gate4_span_FP": 347,
38
+ "eval_gate4_span_TP": 777,
39
+ "eval_gate4_span_f1": 0.7292350958998283,
40
+ "eval_gate4_span_precision": 0.6912811387838854,
41
+ "eval_gate4_span_recall": 0.7715988083339463,
42
  "eval_loss": NaN,
43
+ "eval_runtime": 10.4486,
44
+ "eval_samples_per_second": 1131.439,
45
+ "eval_steps_per_second": 35.411,
46
+ "step": 2956
47
  },
48
  {
49
  "epoch": 2.0,
50
+ "grad_norm": 88.20085144042969,
51
+ "learning_rate": 2.4001014884979702e-05,
52
+ "loss": 1.2241,
53
+ "step": 5912
54
  },
55
  {
56
  "epoch": 2.0,
57
+ "eval_gate1_accuracy": 0.8929774552993003,
58
+ "eval_gate1_f1": 0.8820620404399862,
59
+ "eval_gate1_precision": 0.8988718775181306,
60
+ "eval_gate1_recall": 0.871612670119234,
61
+ "eval_gate1_support": 3859,
62
+ "eval_gate2_accuracy": 0.808240476807463,
63
+ "eval_gate2_f1": 0.6881412582252169,
64
+ "eval_gate2_precision": 0.6832538631102347,
65
+ "eval_gate2_recall": 0.6996653263704344,
66
+ "eval_gate2_support": 3859,
67
+ "eval_gate3_accuracy": 0.8666666666666667,
68
+ "eval_gate3_f1": 0.744109590199225,
69
+ "eval_gate3_precision": 0.7653765174358127,
70
+ "eval_gate3_recall": 0.7614317320508905,
71
  "eval_gate3_support": 6945,
72
+ "eval_gate4_span_FN": 221,
73
+ "eval_gate4_span_FP": 295,
74
+ "eval_gate4_span_TP": 786,
75
+ "eval_gate4_span_f1": 0.7528735582174595,
76
+ "eval_gate4_span_precision": 0.7271045328332368,
77
+ "eval_gate4_span_recall": 0.7805362462683164,
78
  "eval_loss": NaN,
79
+ "eval_runtime": 10.4006,
80
+ "eval_samples_per_second": 1136.67,
81
+ "eval_steps_per_second": 35.575,
82
+ "step": 5912
83
  },
84
  {
85
  "epoch": 3.0,
86
+ "grad_norm": 67.10189056396484,
87
+ "learning_rate": 2.10010148849797e-05,
88
+ "loss": 0.8652,
89
+ "step": 8868
90
  },
91
  {
92
  "epoch": 3.0,
93
+ "eval_gate1_accuracy": 0.9059341798393367,
94
+ "eval_gate1_f1": 0.8997563137620789,
95
+ "eval_gate1_precision": 0.899055894281647,
96
+ "eval_gate1_recall": 0.9004810366878294,
97
+ "eval_gate1_support": 3859,
98
+ "eval_gate2_accuracy": 0.8333765224151335,
99
+ "eval_gate2_f1": 0.7799911701221585,
100
+ "eval_gate2_precision": 0.8104194561625689,
101
+ "eval_gate2_recall": 0.7600982965627961,
102
+ "eval_gate2_support": 3859,
103
+ "eval_gate3_accuracy": 0.8732901367890569,
104
+ "eval_gate3_f1": 0.7904223821154268,
105
+ "eval_gate3_precision": 0.8444284314763446,
106
+ "eval_gate3_recall": 0.7593577482285429,
107
  "eval_gate3_support": 6945,
108
+ "eval_gate4_span_FN": 236,
109
+ "eval_gate4_span_FP": 228,
110
+ "eval_gate4_span_TP": 771,
111
+ "eval_gate4_span_f1": 0.7686939132376799,
112
+ "eval_gate4_span_precision": 0.7717717717640463,
113
+ "eval_gate4_span_recall": 0.7656405163776997,
114
  "eval_loss": NaN,
115
+ "eval_runtime": 10.3684,
116
+ "eval_samples_per_second": 1140.196,
117
+ "eval_steps_per_second": 35.685,
118
+ "step": 8868
119
  },
120
  {
121
  "epoch": 4.0,
122
+ "grad_norm": 173.31228637695312,
123
+ "learning_rate": 1.8001014884979702e-05,
124
+ "loss": 0.6376,
125
+ "step": 11824
126
  },
127
  {
128
  "epoch": 4.0,
129
+ "eval_gate1_accuracy": 0.9077481212749416,
130
+ "eval_gate1_f1": 0.9007457126723182,
131
+ "eval_gate1_precision": 0.9041686699243279,
132
+ "eval_gate1_recall": 0.8977536805400228,
133
+ "eval_gate1_support": 3859,
134
+ "eval_gate2_accuracy": 0.8419279606115574,
135
+ "eval_gate2_f1": 0.7689803309009853,
136
+ "eval_gate2_precision": 0.7719738299874924,
137
+ "eval_gate2_recall": 0.7762247755795892,
138
+ "eval_gate2_support": 3859,
139
+ "eval_gate3_accuracy": 0.8780417566594673,
140
+ "eval_gate3_f1": 0.8038529609303686,
141
+ "eval_gate3_precision": 0.8238117797554888,
142
+ "eval_gate3_recall": 0.7978850610103051,
143
  "eval_gate3_support": 6945,
144
+ "eval_gate4_span_FN": 218,
145
+ "eval_gate4_span_FP": 226,
146
+ "eval_gate4_span_TP": 789,
147
+ "eval_gate4_span_f1": 0.7804154252594212,
148
+ "eval_gate4_span_precision": 0.777339901470174,
149
+ "eval_gate4_span_recall": 0.7835153922464397,
150
  "eval_loss": NaN,
151
+ "eval_runtime": 10.3445,
152
+ "eval_samples_per_second": 1142.825,
153
+ "eval_steps_per_second": 35.768,
154
+ "step": 11824
155
  },
156
  {
157
  "epoch": 5.0,
158
+ "grad_norm": 22.405181884765625,
159
+ "learning_rate": 1.5001014884979702e-05,
160
+ "loss": 0.4713,
161
+ "step": 14780
162
  },
163
  {
164
  "epoch": 5.0,
165
+ "eval_gate1_accuracy": 0.9124125421093547,
166
+ "eval_gate1_f1": 0.905395262879988,
167
+ "eval_gate1_precision": 0.9108288424356044,
168
+ "eval_gate1_recall": 0.9009235044132069,
169
+ "eval_gate1_support": 3859,
170
+ "eval_gate2_accuracy": 0.8608447784400104,
171
+ "eval_gate2_f1": 0.7846052784615595,
172
+ "eval_gate2_precision": 0.7779462341191327,
173
+ "eval_gate2_recall": 0.8035688815922226,
174
+ "eval_gate2_support": 3859,
175
+ "eval_gate3_accuracy": 0.8822174226061915,
176
+ "eval_gate3_f1": 0.799720850034007,
177
+ "eval_gate3_precision": 0.7922933108551248,
178
+ "eval_gate3_recall": 0.8164975006789633,
179
  "eval_gate3_support": 6945,
180
+ "eval_gate4_span_FN": 217,
181
+ "eval_gate4_span_FP": 204,
182
+ "eval_gate4_span_TP": 790,
183
+ "eval_gate4_span_f1": 0.7896051923936183,
184
+ "eval_gate4_span_precision": 0.7947686116620245,
185
+ "eval_gate4_span_recall": 0.7845084409058142,
186
  "eval_loss": NaN,
187
+ "eval_runtime": 10.3367,
188
+ "eval_samples_per_second": 1143.691,
189
+ "eval_steps_per_second": 35.795,
190
+ "step": 14780
191
  },
192
  {
193
  "epoch": 6.0,
194
+ "grad_norm": 150.47354125976562,
195
+ "learning_rate": 1.2001014884979702e-05,
196
+ "loss": 0.3573,
197
+ "step": 17736
198
  },
199
  {
200
  "epoch": 6.0,
201
+ "eval_gate1_accuracy": 0.9168178284529671,
202
+ "eval_gate1_f1": 0.91133041633164,
203
+ "eval_gate1_precision": 0.9107173896884344,
204
+ "eval_gate1_recall": 0.9119611098684928,
205
+ "eval_gate1_support": 3859,
206
+ "eval_gate2_accuracy": 0.8647317958020212,
207
+ "eval_gate2_f1": 0.7980336380648058,
208
+ "eval_gate2_precision": 0.8117843067907142,
209
+ "eval_gate2_recall": 0.7909589217708924,
210
+ "eval_gate2_support": 3859,
211
+ "eval_gate3_accuracy": 0.8846652267818574,
212
+ "eval_gate3_f1": 0.7968635418767978,
213
+ "eval_gate3_precision": 0.8025916830061807,
214
+ "eval_gate3_recall": 0.7966439892081336,
215
  "eval_gate3_support": 6945,
216
+ "eval_gate4_span_FN": 198,
217
+ "eval_gate4_span_FP": 242,
218
+ "eval_gate4_span_TP": 809,
219
+ "eval_gate4_span_f1": 0.786200189358105,
220
+ "eval_gate4_span_precision": 0.7697431018004782,
221
+ "eval_gate4_span_recall": 0.8033763654339288,
222
  "eval_loss": NaN,
223
+ "eval_runtime": 10.3401,
224
+ "eval_samples_per_second": 1143.318,
225
+ "eval_steps_per_second": 35.783,
226
+ "step": 17736
227
  },
228
  {
229
  "epoch": 7.0,
230
+ "grad_norm": 270.212646484375,
231
+ "learning_rate": 9.001014884979702e-06,
232
+ "loss": 0.2711,
233
+ "step": 20692
234
  },
235
  {
236
  "epoch": 7.0,
237
+ "eval_gate1_accuracy": 0.9191500388701737,
238
+ "eval_gate1_f1": 0.9137570612727655,
239
+ "eval_gate1_precision": 0.9134164984755443,
240
+ "eval_gate1_recall": 0.9141029060064348,
241
+ "eval_gate1_support": 3859,
242
+ "eval_gate2_accuracy": 0.8693962166364343,
243
+ "eval_gate2_f1": 0.8124767328435765,
244
+ "eval_gate2_precision": 0.8061838445118481,
245
+ "eval_gate2_recall": 0.8279748920673979,
246
+ "eval_gate2_support": 3859,
247
+ "eval_gate3_accuracy": 0.8862491000719942,
248
+ "eval_gate3_f1": 0.8027532601826777,
249
+ "eval_gate3_precision": 0.7866745156811082,
250
+ "eval_gate3_recall": 0.8226565082669126,
251
  "eval_gate3_support": 6945,
252
+ "eval_gate4_span_FN": 251,
253
+ "eval_gate4_span_FP": 213,
254
+ "eval_gate4_span_TP": 756,
255
+ "eval_gate4_span_f1": 0.7651821812289223,
256
+ "eval_gate4_span_precision": 0.7801857585058805,
257
+ "eval_gate4_span_recall": 0.750744786487083,
258
  "eval_loss": NaN,
259
+ "eval_runtime": 10.4102,
260
+ "eval_samples_per_second": 1135.613,
261
+ "eval_steps_per_second": 35.542,
262
+ "step": 20692
263
  },
264
  {
265
  "epoch": 8.0,
266
+ "grad_norm": 30.083831787109375,
267
+ "learning_rate": 6.001014884979703e-06,
268
+ "loss": 0.2072,
269
+ "step": 23648
270
  },
271
  {
272
  "epoch": 8.0,
273
+ "eval_gate1_accuracy": 0.9194091733609744,
274
+ "eval_gate1_f1": 0.9136575067455691,
275
+ "eval_gate1_precision": 0.9151861735925785,
276
+ "eval_gate1_recall": 0.9122216295888463,
277
+ "eval_gate1_support": 3859,
278
+ "eval_gate2_accuracy": 0.8683596786732314,
279
+ "eval_gate2_f1": 0.7953213528224212,
280
+ "eval_gate2_precision": 0.7941072643208182,
281
+ "eval_gate2_recall": 0.8039876906998746,
282
+ "eval_gate2_support": 3859,
283
+ "eval_gate3_accuracy": 0.8859611231101512,
284
+ "eval_gate3_f1": 0.8067851499228712,
285
+ "eval_gate3_precision": 0.8044692044507203,
286
+ "eval_gate3_recall": 0.8120360484679332,
287
  "eval_gate3_support": 6945,
288
+ "eval_gate4_span_FN": 211,
289
+ "eval_gate4_span_FP": 223,
290
+ "eval_gate4_span_TP": 796,
291
+ "eval_gate4_span_f1": 0.7857847926232181,
292
+ "eval_gate4_span_precision": 0.7811579980296255,
293
+ "eval_gate4_span_recall": 0.7904667328620609,
294
  "eval_loss": NaN,
295
+ "eval_runtime": 10.415,
296
+ "eval_samples_per_second": 1135.098,
297
+ "eval_steps_per_second": 35.526,
298
+ "step": 23648
299
  },
300
  {
301
  "epoch": 9.0,
302
+ "grad_norm": 303.0519104003906,
303
+ "learning_rate": 3.0010148849797024e-06,
304
+ "loss": 0.1509,
305
+ "step": 26604
306
  },
307
  {
308
  "epoch": 9.0,
309
+ "eval_gate1_accuracy": 0.9217413837781808,
310
+ "eval_gate1_f1": 0.9163582001286115,
311
+ "eval_gate1_precision": 0.9168310136033854,
312
+ "eval_gate1_recall": 0.915894857280501,
313
+ "eval_gate1_support": 3859,
314
+ "eval_gate2_accuracy": 0.8717284270536408,
315
+ "eval_gate2_f1": 0.8542694094275488,
316
+ "eval_gate2_precision": 0.8495135391288109,
317
+ "eval_gate2_recall": 0.8711254994444528,
318
+ "eval_gate2_support": 3859,
319
+ "eval_gate3_accuracy": 0.8866810655147588,
320
+ "eval_gate3_f1": 0.8118642371342876,
321
+ "eval_gate3_precision": 0.8115033608543574,
322
+ "eval_gate3_recall": 0.8169535217733972,
323
  "eval_gate3_support": 6945,
324
+ "eval_gate4_span_FN": 216,
325
+ "eval_gate4_span_FP": 233,
326
+ "eval_gate4_span_TP": 791,
327
+ "eval_gate4_span_f1": 0.7789266321172492,
328
+ "eval_gate4_span_precision": 0.7724609374924565,
329
+ "eval_gate4_span_recall": 0.7855014895651886,
330
  "eval_loss": NaN,
331
+ "eval_runtime": 10.45,
332
+ "eval_samples_per_second": 1131.292,
333
+ "eval_steps_per_second": 35.407,
334
+ "step": 26604
335
  },
336
  {
337
  "epoch": 10.0,
338
+ "grad_norm": 4.396928310394287,
339
+ "learning_rate": 1.0148849797023006e-09,
340
+ "loss": 0.122,
341
+ "step": 29560
342
  },
343
  {
344
  "epoch": 10.0,
345
+ "eval_gate1_accuracy": 0.9212231147965795,
346
+ "eval_gate1_f1": 0.9159218285491496,
347
+ "eval_gate1_precision": 0.915806583633259,
348
+ "eval_gate1_recall": 0.9160376628069029,
349
+ "eval_gate1_support": 3859,
350
+ "eval_gate2_accuracy": 0.8722466960352423,
351
+ "eval_gate2_f1": 0.856680976809179,
352
+ "eval_gate2_precision": 0.8659863944374855,
353
+ "eval_gate2_recall": 0.8537404898111944,
354
+ "eval_gate2_support": 3859,
355
+ "eval_gate3_accuracy": 0.8875449964002879,
356
+ "eval_gate3_f1": 0.8118433314020443,
357
+ "eval_gate3_precision": 0.8153146247248837,
358
+ "eval_gate3_recall": 0.8127560834123785,
359
  "eval_gate3_support": 6945,
360
+ "eval_gate4_span_FN": 213,
361
+ "eval_gate4_span_FP": 233,
362
+ "eval_gate4_span_TP": 794,
363
+ "eval_gate4_span_f1": 0.7807276252779591,
364
+ "eval_gate4_span_precision": 0.7731256085611187,
365
+ "eval_gate4_span_recall": 0.788480635543312,
366
  "eval_loss": NaN,
367
+ "eval_runtime": 10.3467,
368
+ "eval_samples_per_second": 1142.581,
369
+ "eval_steps_per_second": 35.76,
370
+ "step": 29560
371
  },
372
  {
373
  "epoch": 10.0,
374
+ "step": 29560,
375
+ "total_flos": 5.801469413818084e+16,
376
+ "train_loss": 0.6573912851542678,
377
+ "train_runtime": 2140.4043,
378
+ "train_samples_per_second": 441.828,
379
+ "train_steps_per_second": 13.81
380
  },
381
  {
382
  "epoch": 10.0,
383
+ "eval_gate1_accuracy": 0.9217413837781808,
384
+ "eval_gate1_f1": 0.9163582001286115,
385
+ "eval_gate1_precision": 0.9168310136033854,
386
+ "eval_gate1_recall": 0.915894857280501,
387
+ "eval_gate1_support": 3859,
388
+ "eval_gate2_accuracy": 0.8717284270536408,
389
+ "eval_gate2_f1": 0.8542694094275488,
390
+ "eval_gate2_precision": 0.8495135391288109,
391
+ "eval_gate2_recall": 0.8711254994444528,
392
+ "eval_gate2_support": 3859,
393
+ "eval_gate3_accuracy": 0.8866810655147588,
394
+ "eval_gate3_f1": 0.8118642371342876,
395
+ "eval_gate3_precision": 0.8115033608543574,
396
+ "eval_gate3_recall": 0.8169535217733972,
397
  "eval_gate3_support": 6945,
398
+ "eval_gate4_span_FN": 216,
399
+ "eval_gate4_span_FP": 233,
400
+ "eval_gate4_span_TP": 791,
401
+ "eval_gate4_span_f1": 0.7789266321172492,
402
+ "eval_gate4_span_precision": 0.7724609374924565,
403
+ "eval_gate4_span_recall": 0.7855014895651886,
404
  "eval_loss": NaN,
405
+ "eval_runtime": 10.4531,
406
+ "eval_samples_per_second": 1130.954,
407
+ "eval_steps_per_second": 35.396,
408
+ "step": 29560
409
  },
410
  {
411
  "epoch": 10.0,
412
+ "eval_gate1_accuracy": 0.9251295336787565,
413
+ "eval_gate1_f1": 0.9199371922438249,
414
+ "eval_gate1_precision": 0.920966070966071,
415
+ "eval_gate1_recall": 0.9189513092953367,
416
+ "eval_gate1_support": 3860,
417
+ "eval_gate2_accuracy": 0.8709844559585492,
418
+ "eval_gate2_f1": 0.8487797208181732,
419
+ "eval_gate2_precision": 0.8500529357712848,
420
+ "eval_gate2_recall": 0.8532136788618205,
421
+ "eval_gate2_support": 3860,
422
+ "eval_gate3_accuracy": 0.8920086393088553,
423
+ "eval_gate3_f1": 0.6992827001481418,
424
+ "eval_gate3_precision": 0.715591871957983,
425
+ "eval_gate3_recall": 0.7063340262769819,
426
  "eval_gate3_support": 6945,
427
+ "eval_gate4_span_FN": 196,
428
+ "eval_gate4_span_FP": 204,
429
+ "eval_gate4_span_TP": 815,
430
+ "eval_gate4_span_f1": 0.8029556600167974,
431
+ "eval_gate4_span_precision": 0.7998037291383728,
432
+ "eval_gate4_span_recall": 0.8061325420296129,
433
  "eval_loss": NaN,
434
+ "eval_runtime": 10.4274,
435
+ "eval_samples_per_second": 1133.841,
436
+ "eval_steps_per_second": 35.483,
437
+ "step": 29560
438
  }
439
  ],
440
  "logging_steps": 500,
441
+ "max_steps": 29560,
442
  "num_input_tokens_seen": 0,
443
  "num_train_epochs": 10,
444
  "save_steps": 500,
 
454
  "attributes": {}
455
  }
456
  },
457
+ "total_flos": 5.801469413818084e+16,
458
  "train_batch_size": 32,
459
  "trial_name": null,
460
  "trial_params": null
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fc2cd185761d66131bcc0f43bbd2ae2a01a355c15e6af12eb5fb05584d22f893
3
  size 5841
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bcf99fea5e0d29ea31021a60b825b759ebcc369e52c3076e24dd45d270cb7764
3
  size 5841