File size: 12,200 Bytes
345d0ac
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
{
  "best_global_step": 2500,
  "best_metric": 0.8745242401633876,
  "best_model_checkpoint": "models\\improved_model\\checkpoint-2500",
  "epoch": 5.0,
  "eval_steps": 500,
  "global_step": 3435,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 0.14556040756914118,
      "grad_norm": 5.4006147384643555,
      "learning_rate": 9.900000000000002e-06,
      "loss": 1.0779,
      "step": 100
    },
    {
      "epoch": 0.29112081513828236,
      "grad_norm": 7.964382171630859,
      "learning_rate": 1.9900000000000003e-05,
      "loss": 0.3444,
      "step": 200
    },
    {
      "epoch": 0.4366812227074236,
      "grad_norm": 6.473100185394287,
      "learning_rate": 2.9900000000000002e-05,
      "loss": 0.2621,
      "step": 300
    },
    {
      "epoch": 0.5822416302765647,
      "grad_norm": 2.3269290924072266,
      "learning_rate": 3.99e-05,
      "loss": 0.2215,
      "step": 400
    },
    {
      "epoch": 0.727802037845706,
      "grad_norm": 1.0794602632522583,
      "learning_rate": 4.99e-05,
      "loss": 0.1994,
      "step": 500
    },
    {
      "epoch": 0.727802037845706,
      "eval_accuracy": 0.8291404612159329,
      "eval_f1": 0.8347849048667186,
      "eval_f1_bearish": 0.7192982456140351,
      "eval_f1_bullish": 0.8773747841105354,
      "eval_f1_neutral": 0.7843137254901961,
      "eval_loss": 0.16642487049102783,
      "eval_precision": 0.8522584333905088,
      "eval_precision_bearish": 0.6212121212121212,
      "eval_precision_bullish": 0.9407407407407408,
      "eval_precision_neutral": 0.7407407407407407,
      "eval_recall": 0.8291404612159329,
      "eval_recall_bearish": 0.8541666666666666,
      "eval_recall_bullish": 0.8220064724919094,
      "eval_recall_neutral": 0.8333333333333334,
      "eval_runtime": 8.1987,
      "eval_samples_per_second": 116.359,
      "eval_steps_per_second": 3.659,
      "step": 500
    },
    {
      "epoch": 0.8733624454148472,
      "grad_norm": 10.456722259521484,
      "learning_rate": 4.831345826235094e-05,
      "loss": 0.1798,
      "step": 600
    },
    {
      "epoch": 1.0189228529839884,
      "grad_norm": 0.8317745327949524,
      "learning_rate": 4.660988074957411e-05,
      "loss": 0.1477,
      "step": 700
    },
    {
      "epoch": 1.1644832605531295,
      "grad_norm": 13.93519401550293,
      "learning_rate": 4.490630323679728e-05,
      "loss": 0.1027,
      "step": 800
    },
    {
      "epoch": 1.3100436681222707,
      "grad_norm": 5.650792598724365,
      "learning_rate": 4.320272572402044e-05,
      "loss": 0.1093,
      "step": 900
    },
    {
      "epoch": 1.455604075691412,
      "grad_norm": 2.2038004398345947,
      "learning_rate": 4.1499148211243615e-05,
      "loss": 0.1091,
      "step": 1000
    },
    {
      "epoch": 1.455604075691412,
      "eval_accuracy": 0.8542976939203354,
      "eval_f1": 0.854962642061992,
      "eval_f1_bearish": 0.7436823104693141,
      "eval_f1_bullish": 0.9034369885433715,
      "eval_f1_neutral": 0.78239608801956,
      "eval_loss": 0.22784079611301422,
      "eval_precision": 0.85731689649448,
      "eval_precision_bearish": 0.7744360902255639,
      "eval_precision_bullish": 0.9139072847682119,
      "eval_precision_neutral": 0.7373271889400922,
      "eval_recall": 0.8542976939203354,
      "eval_recall_bearish": 0.7152777777777778,
      "eval_recall_bullish": 0.8932038834951457,
      "eval_recall_neutral": 0.8333333333333334,
      "eval_runtime": 8.8257,
      "eval_samples_per_second": 108.094,
      "eval_steps_per_second": 3.399,
      "step": 1000
    },
    {
      "epoch": 1.6011644832605532,
      "grad_norm": 4.665580749511719,
      "learning_rate": 3.9795570698466784e-05,
      "loss": 0.0851,
      "step": 1100
    },
    {
      "epoch": 1.7467248908296944,
      "grad_norm": 0.20554736256599426,
      "learning_rate": 3.809199318568995e-05,
      "loss": 0.0983,
      "step": 1200
    },
    {
      "epoch": 1.8922852983988356,
      "grad_norm": 2.3172614574432373,
      "learning_rate": 3.638841567291312e-05,
      "loss": 0.0908,
      "step": 1300
    },
    {
      "epoch": 2.037845705967977,
      "grad_norm": 0.20416907966136932,
      "learning_rate": 3.468483816013629e-05,
      "loss": 0.072,
      "step": 1400
    },
    {
      "epoch": 2.183406113537118,
      "grad_norm": 0.08527473360300064,
      "learning_rate": 3.298126064735946e-05,
      "loss": 0.0316,
      "step": 1500
    },
    {
      "epoch": 2.183406113537118,
      "eval_accuracy": 0.8616352201257862,
      "eval_f1": 0.8636672911856373,
      "eval_f1_bearish": 0.7516339869281046,
      "eval_f1_bullish": 0.9054726368159204,
      "eval_f1_neutral": 0.8131313131313131,
      "eval_loss": 0.24344488978385925,
      "eval_precision": 0.8675144411363428,
      "eval_precision_bearish": 0.7098765432098766,
      "eval_precision_bullish": 0.9285714285714286,
      "eval_precision_neutral": 0.7892156862745098,
      "eval_recall": 0.8616352201257862,
      "eval_recall_bearish": 0.7986111111111112,
      "eval_recall_bullish": 0.883495145631068,
      "eval_recall_neutral": 0.8385416666666666,
      "eval_runtime": 8.6074,
      "eval_samples_per_second": 110.835,
      "eval_steps_per_second": 3.485,
      "step": 1500
    },
    {
      "epoch": 2.328966521106259,
      "grad_norm": 7.853630065917969,
      "learning_rate": 3.1277683134582626e-05,
      "loss": 0.0363,
      "step": 1600
    },
    {
      "epoch": 2.4745269286754,
      "grad_norm": 0.3771085739135742,
      "learning_rate": 2.957410562180579e-05,
      "loss": 0.0347,
      "step": 1700
    },
    {
      "epoch": 2.6200873362445414,
      "grad_norm": 3.0605719089508057,
      "learning_rate": 2.787052810902896e-05,
      "loss": 0.0319,
      "step": 1800
    },
    {
      "epoch": 2.7656477438136826,
      "grad_norm": 3.2105116844177246,
      "learning_rate": 2.616695059625213e-05,
      "loss": 0.0359,
      "step": 1900
    },
    {
      "epoch": 2.911208151382824,
      "grad_norm": 3.7454285621643066,
      "learning_rate": 2.44633730834753e-05,
      "loss": 0.0361,
      "step": 2000
    },
    {
      "epoch": 2.911208151382824,
      "eval_accuracy": 0.8584905660377359,
      "eval_f1": 0.8593807235316668,
      "eval_f1_bearish": 0.7571428571428571,
      "eval_f1_bullish": 0.9074529074529074,
      "eval_f1_neutral": 0.7813267813267813,
      "eval_loss": 0.2744849622249603,
      "eval_precision": 0.8616426481335732,
      "eval_precision_bearish": 0.7794117647058824,
      "eval_precision_bullish": 0.9187396351575456,
      "eval_precision_neutral": 0.7395348837209302,
      "eval_recall": 0.8584905660377359,
      "eval_recall_bearish": 0.7361111111111112,
      "eval_recall_bullish": 0.8964401294498382,
      "eval_recall_neutral": 0.828125,
      "eval_runtime": 8.1534,
      "eval_samples_per_second": 117.007,
      "eval_steps_per_second": 3.679,
      "step": 2000
    },
    {
      "epoch": 3.056768558951965,
      "grad_norm": 0.04752872511744499,
      "learning_rate": 2.2759795570698465e-05,
      "loss": 0.0169,
      "step": 2100
    },
    {
      "epoch": 3.2023289665211063,
      "grad_norm": 3.445439100265503,
      "learning_rate": 2.1056218057921637e-05,
      "loss": 0.0094,
      "step": 2200
    },
    {
      "epoch": 3.3478893740902476,
      "grad_norm": 1.7491494417190552,
      "learning_rate": 1.9352640545144805e-05,
      "loss": 0.0084,
      "step": 2300
    },
    {
      "epoch": 3.493449781659389,
      "grad_norm": 1.3558599948883057,
      "learning_rate": 1.7649063032367974e-05,
      "loss": 0.0155,
      "step": 2400
    },
    {
      "epoch": 3.6390101892285296,
      "grad_norm": 0.7178720235824585,
      "learning_rate": 1.5945485519591142e-05,
      "loss": 0.0166,
      "step": 2500
    },
    {
      "epoch": 3.6390101892285296,
      "eval_accuracy": 0.8752620545073375,
      "eval_f1": 0.8745242401633876,
      "eval_f1_bearish": 0.7612456747404844,
      "eval_f1_bullish": 0.9131474103585657,
      "eval_f1_neutral": 0.8351648351648352,
      "eval_loss": 0.27798759937286377,
      "eval_precision": 0.8750783502197678,
      "eval_precision_bearish": 0.7586206896551724,
      "eval_precision_bullish": 0.8995290423861853,
      "eval_precision_neutral": 0.8837209302325582,
      "eval_recall": 0.8752620545073375,
      "eval_recall_bearish": 0.7638888888888888,
      "eval_recall_bullish": 0.9271844660194175,
      "eval_recall_neutral": 0.7916666666666666,
      "eval_runtime": 8.5538,
      "eval_samples_per_second": 111.529,
      "eval_steps_per_second": 3.507,
      "step": 2500
    },
    {
      "epoch": 3.7845705967976713,
      "grad_norm": 0.5409824252128601,
      "learning_rate": 1.424190800681431e-05,
      "loss": 0.0072,
      "step": 2600
    },
    {
      "epoch": 3.930131004366812,
      "grad_norm": 0.007624503690749407,
      "learning_rate": 1.253833049403748e-05,
      "loss": 0.0051,
      "step": 2700
    },
    {
      "epoch": 4.075691411935954,
      "grad_norm": 0.03979913145303726,
      "learning_rate": 1.0834752981260648e-05,
      "loss": 0.0106,
      "step": 2800
    },
    {
      "epoch": 4.2212518195050945,
      "grad_norm": 0.025390487164258957,
      "learning_rate": 9.131175468483816e-06,
      "loss": 0.003,
      "step": 2900
    },
    {
      "epoch": 4.366812227074236,
      "grad_norm": 8.90622615814209,
      "learning_rate": 7.427597955706985e-06,
      "loss": 0.0066,
      "step": 3000
    },
    {
      "epoch": 4.366812227074236,
      "eval_accuracy": 0.8742138364779874,
      "eval_f1": 0.8740584051302639,
      "eval_f1_bearish": 0.7659574468085106,
      "eval_f1_bullish": 0.9174757281553398,
      "eval_f1_neutral": 0.8153846153846154,
      "eval_loss": 0.3259490132331848,
      "eval_precision": 0.8740853986957351,
      "eval_precision_bearish": 0.782608695652174,
      "eval_precision_bullish": 0.9174757281553398,
      "eval_precision_neutral": 0.803030303030303,
      "eval_recall": 0.8742138364779874,
      "eval_recall_bearish": 0.75,
      "eval_recall_bullish": 0.9174757281553398,
      "eval_recall_neutral": 0.828125,
      "eval_runtime": 9.0626,
      "eval_samples_per_second": 105.268,
      "eval_steps_per_second": 3.31,
      "step": 3000
    },
    {
      "epoch": 4.512372634643377,
      "grad_norm": 0.0042578354477882385,
      "learning_rate": 5.724020442930154e-06,
      "loss": 0.0021,
      "step": 3100
    },
    {
      "epoch": 4.657933042212518,
      "grad_norm": 0.0550072155892849,
      "learning_rate": 4.0204429301533224e-06,
      "loss": 0.0065,
      "step": 3200
    },
    {
      "epoch": 4.8034934497816595,
      "grad_norm": 0.019497277215123177,
      "learning_rate": 2.3168654173764905e-06,
      "loss": 0.0023,
      "step": 3300
    },
    {
      "epoch": 4.9490538573508,
      "grad_norm": 0.012889917939901352,
      "learning_rate": 6.132879045996593e-07,
      "loss": 0.0031,
      "step": 3400
    }
  ],
  "logging_steps": 100,
  "max_steps": 3435,
  "num_input_tokens_seen": 0,
  "num_train_epochs": 5,
  "save_steps": 500,
  "stateful_callbacks": {
    "EarlyStoppingCallback": {
      "args": {
        "early_stopping_patience": 3,
        "early_stopping_threshold": 0.0
      },
      "attributes": {
        "early_stopping_patience_counter": 1
      }
    },
    "TrainerControl": {
      "args": {
        "should_epoch_stop": false,
        "should_evaluate": false,
        "should_log": false,
        "should_save": true,
        "should_training_stop": true
      },
      "attributes": {}
    }
  },
  "total_flos": 1.444624220035584e+16,
  "train_batch_size": 16,
  "trial_name": null,
  "trial_params": null
}