File size: 7,514 Bytes
54ca777
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
{
  "best_metric": 0.21624045073986053,
  "best_model_checkpoint": "/hpcwork/vg380347/NER/EduGBERT/checkpoint-550",
  "epoch": 7.446808510638298,
  "eval_steps": 50,
  "global_step": 1050,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 0.35,
      "eval_f1": 0.5815712900096993,
      "eval_loss": 0.3045153319835663,
      "eval_precision": 0.5216332212040367,
      "eval_recall": 0.6570718877849211,
      "eval_runtime": 7.1562,
      "eval_samples_per_second": 629.381,
      "eval_steps_per_second": 5.031,
      "step": 50
    },
    {
      "epoch": 0.71,
      "eval_f1": 0.6822522225880804,
      "eval_loss": 0.25079214572906494,
      "eval_precision": 0.6210286536386525,
      "eval_recall": 0.7568673290473408,
      "eval_runtime": 7.2954,
      "eval_samples_per_second": 617.376,
      "eval_steps_per_second": 4.935,
      "step": 100
    },
    {
      "epoch": 1.06,
      "eval_f1": 0.7016087182148418,
      "eval_loss": 0.24814821779727936,
      "eval_precision": 0.6308912739150724,
      "eval_recall": 0.7901811805961426,
      "eval_runtime": 7.1783,
      "eval_samples_per_second": 627.45,
      "eval_steps_per_second": 5.015,
      "step": 150
    },
    {
      "epoch": 1.42,
      "eval_f1": 0.7199271355149306,
      "eval_loss": 0.2445540428161621,
      "eval_precision": 0.6488800281458895,
      "eval_recall": 0.8084453535943893,
      "eval_runtime": 7.1384,
      "eval_samples_per_second": 630.95,
      "eval_steps_per_second": 5.043,
      "step": 200
    },
    {
      "epoch": 1.77,
      "eval_f1": 0.722252082773448,
      "eval_loss": 0.22964715957641602,
      "eval_precision": 0.6685323383084577,
      "eval_recall": 0.7853594389246055,
      "eval_runtime": 7.434,
      "eval_samples_per_second": 605.866,
      "eval_steps_per_second": 4.843,
      "step": 250
    },
    {
      "epoch": 2.13,
      "eval_f1": 0.7319960997353392,
      "eval_loss": 0.21758420765399933,
      "eval_precision": 0.6993611924407772,
      "eval_recall": 0.7678258328462887,
      "eval_runtime": 7.1469,
      "eval_samples_per_second": 630.207,
      "eval_steps_per_second": 5.037,
      "step": 300
    },
    {
      "epoch": 2.48,
      "eval_f1": 0.7406113537117905,
      "eval_loss": 0.22185301780700684,
      "eval_precision": 0.6854868797413257,
      "eval_recall": 0.8053769725306839,
      "eval_runtime": 7.1574,
      "eval_samples_per_second": 629.281,
      "eval_steps_per_second": 5.03,
      "step": 350
    },
    {
      "epoch": 2.84,
      "eval_f1": 0.7412340309866812,
      "eval_loss": 0.2164618819952011,
      "eval_precision": 0.6928353658536586,
      "eval_recall": 0.7969023962594973,
      "eval_runtime": 7.1409,
      "eval_samples_per_second": 630.735,
      "eval_steps_per_second": 5.041,
      "step": 400
    },
    {
      "epoch": 3.19,
      "eval_f1": 0.7499483221938952,
      "eval_loss": 0.2220638245344162,
      "eval_precision": 0.7096101186595384,
      "eval_recall": 0.7951490356516657,
      "eval_runtime": 7.4483,
      "eval_samples_per_second": 604.703,
      "eval_steps_per_second": 4.833,
      "step": 450
    },
    {
      "epoch": 3.55,
      "learning_rate": 4.822695035460993e-06,
      "loss": 0.2581,
      "step": 500
    },
    {
      "epoch": 3.55,
      "eval_f1": 0.7439247452312516,
      "eval_loss": 0.2487693727016449,
      "eval_precision": 0.6727315689981096,
      "eval_recall": 0.8319696084161309,
      "eval_runtime": 7.1497,
      "eval_samples_per_second": 629.957,
      "eval_steps_per_second": 5.035,
      "step": 500
    },
    {
      "epoch": 3.9,
      "eval_f1": 0.7555155958226711,
      "eval_loss": 0.21624045073986053,
      "eval_precision": 0.717268548916612,
      "eval_recall": 0.7980713033313852,
      "eval_runtime": 7.1536,
      "eval_samples_per_second": 629.612,
      "eval_steps_per_second": 5.032,
      "step": 550
    },
    {
      "epoch": 4.26,
      "eval_f1": 0.7588671611598112,
      "eval_loss": 0.23951853811740875,
      "eval_precision": 0.7046080641121963,
      "eval_recall": 0.8221800116890707,
      "eval_runtime": 7.0397,
      "eval_samples_per_second": 639.8,
      "eval_steps_per_second": 5.114,
      "step": 600
    },
    {
      "epoch": 4.61,
      "eval_f1": 0.7562726374711887,
      "eval_loss": 0.24661774933338165,
      "eval_precision": 0.688406665867402,
      "eval_recall": 0.8389830508474576,
      "eval_runtime": 7.1388,
      "eval_samples_per_second": 630.916,
      "eval_steps_per_second": 5.043,
      "step": 650
    },
    {
      "epoch": 4.96,
      "eval_f1": 0.7577822311289245,
      "eval_loss": 0.24025806784629822,
      "eval_precision": 0.6980063992124046,
      "eval_recall": 0.8287551139684395,
      "eval_runtime": 7.1329,
      "eval_samples_per_second": 631.441,
      "eval_steps_per_second": 5.047,
      "step": 700
    },
    {
      "epoch": 5.32,
      "eval_f1": 0.7517815517815518,
      "eval_loss": 0.261866956949234,
      "eval_precision": 0.6907355280871375,
      "eval_recall": 0.8246639392168322,
      "eval_runtime": 7.3254,
      "eval_samples_per_second": 614.846,
      "eval_steps_per_second": 4.914,
      "step": 750
    },
    {
      "epoch": 5.67,
      "eval_f1": 0.7615306467998646,
      "eval_loss": 0.2429821491241455,
      "eval_precision": 0.7097588688296932,
      "eval_recall": 0.8214494447691408,
      "eval_runtime": 7.1352,
      "eval_samples_per_second": 631.236,
      "eval_steps_per_second": 5.045,
      "step": 800
    },
    {
      "epoch": 6.03,
      "eval_f1": 0.7594460131773565,
      "eval_loss": 0.24021703004837036,
      "eval_precision": 0.7033623910336239,
      "eval_recall": 0.8252483927527762,
      "eval_runtime": 7.155,
      "eval_samples_per_second": 629.489,
      "eval_steps_per_second": 5.031,
      "step": 850
    },
    {
      "epoch": 6.38,
      "eval_f1": 0.7594716019580233,
      "eval_loss": 0.25845229625701904,
      "eval_precision": 0.70182178708638,
      "eval_recall": 0.8274400935125658,
      "eval_runtime": 7.1743,
      "eval_samples_per_second": 627.796,
      "eval_steps_per_second": 5.018,
      "step": 900
    },
    {
      "epoch": 6.74,
      "eval_f1": 0.7634940255459416,
      "eval_loss": 0.2463415563106537,
      "eval_precision": 0.7202643171806168,
      "eval_recall": 0.8122443015780245,
      "eval_runtime": 7.1315,
      "eval_samples_per_second": 631.568,
      "eval_steps_per_second": 5.048,
      "step": 950
    },
    {
      "epoch": 7.09,
      "learning_rate": 4.645390070921986e-06,
      "loss": 0.1517,
      "step": 1000
    },
    {
      "epoch": 7.09,
      "eval_f1": 0.7641669494401085,
      "eval_loss": 0.25761693716049194,
      "eval_precision": 0.7134710429603346,
      "eval_recall": 0.8226183518410286,
      "eval_runtime": 7.1379,
      "eval_samples_per_second": 630.995,
      "eval_steps_per_second": 5.043,
      "step": 1000
    },
    {
      "epoch": 7.45,
      "eval_f1": 0.7703476197124111,
      "eval_loss": 0.2536332607269287,
      "eval_precision": 0.7375033413525796,
      "eval_recall": 0.8062536528345996,
      "eval_runtime": 7.1375,
      "eval_samples_per_second": 631.035,
      "eval_steps_per_second": 5.044,
      "step": 1050
    }
  ],
  "logging_steps": 500,
  "max_steps": 14100,
  "num_train_epochs": 100,
  "save_steps": 50,
  "total_flos": 6.408198647855674e+16,
  "trial_name": null,
  "trial_params": null
}