JonahDelman commited on
Commit
03261b2
·
1 Parent(s): 187d014

Delete trainer_state.json

Browse files
Files changed (1) hide show
  1. trainer_state.json +0 -193
trainer_state.json DELETED
@@ -1,193 +0,0 @@
1
- {
2
- "best_global_step": 50,
3
- "best_metric": 0.9230769230769231,
4
- "best_model_checkpoint": "model_output/checkpoint-50",
5
- "epoch": 5.0,
6
- "eval_steps": 25,
7
- "global_step": 50,
8
- "is_hyper_param_search": false,
9
- "is_local_process_zero": true,
10
- "is_world_process_zero": true,
11
- "log_history": [
12
- {
13
- "epoch": 0.5,
14
- "grad_norm": 0.7717047929763794,
15
- "learning_rate": 4.912280701754386e-05,
16
- "loss": 0.6998,
17
- "step": 5
18
- },
19
- {
20
- "epoch": 1.0,
21
- "grad_norm": 0.8567419648170471,
22
- "learning_rate": 4.473684210526316e-05,
23
- "loss": 0.6853,
24
- "step": 10
25
- },
26
- {
27
- "epoch": 1.0,
28
- "eval_accuracy": 0.5256410256410257,
29
- "eval_f1": 0.41943572726317213,
30
- "eval_f1_class_0": 0.2127659574468085,
31
- "eval_f1_class_1": 0.6605504587155964,
32
- "eval_loss": 0.6680065989494324,
33
- "eval_precision": 0.7660695468914647,
34
- "eval_precision_class_0": 1.0,
35
- "eval_precision_class_1": 0.4931506849315068,
36
- "eval_recall": 0.5256410256410257,
37
- "eval_runtime": 0.7697,
38
- "eval_samples_per_second": 101.335,
39
- "eval_steps_per_second": 2.598,
40
- "step": 10
41
- },
42
- {
43
- "epoch": 1.5,
44
- "grad_norm": 1.7958896160125732,
45
- "learning_rate": 4.0350877192982455e-05,
46
- "loss": 0.651,
47
- "step": 15
48
- },
49
- {
50
- "epoch": 2.0,
51
- "grad_norm": 2.7093613147735596,
52
- "learning_rate": 3.5964912280701756e-05,
53
- "loss": 0.5555,
54
- "step": 20
55
- },
56
- {
57
- "epoch": 2.0,
58
- "eval_accuracy": 0.7692307692307693,
59
- "eval_f1": 0.7692307692307693,
60
- "eval_f1_class_0": 0.7857142857142857,
61
- "eval_f1_class_1": 0.75,
62
- "eval_loss": 0.5287392735481262,
63
- "eval_precision": 0.7692307692307693,
64
- "eval_precision_class_0": 0.7857142857142857,
65
- "eval_precision_class_1": 0.75,
66
- "eval_recall": 0.7692307692307693,
67
- "eval_runtime": 0.6932,
68
- "eval_samples_per_second": 112.528,
69
- "eval_steps_per_second": 2.885,
70
- "step": 20
71
- },
72
- {
73
- "epoch": 2.5,
74
- "grad_norm": 2.830397129058838,
75
- "learning_rate": 3.157894736842105e-05,
76
- "loss": 0.4365,
77
- "step": 25
78
- },
79
- {
80
- "epoch": 3.0,
81
- "grad_norm": 3.684325695037842,
82
- "learning_rate": 2.7192982456140354e-05,
83
- "loss": 0.3661,
84
- "step": 30
85
- },
86
- {
87
- "epoch": 3.0,
88
- "eval_accuracy": 0.8717948717948718,
89
- "eval_f1": 0.8719638963541402,
90
- "eval_f1_class_0": 0.8780487804878049,
91
- "eval_f1_class_1": 0.8648648648648649,
92
- "eval_loss": 0.35331812500953674,
93
- "eval_precision": 0.8732793522267207,
94
- "eval_precision_class_0": 0.9,
95
- "eval_precision_class_1": 0.8421052631578947,
96
- "eval_recall": 0.8717948717948718,
97
- "eval_runtime": 0.7276,
98
- "eval_samples_per_second": 107.208,
99
- "eval_steps_per_second": 2.749,
100
- "step": 30
101
- },
102
- {
103
- "epoch": 3.5,
104
- "grad_norm": 2.4954941272735596,
105
- "learning_rate": 2.280701754385965e-05,
106
- "loss": 0.2656,
107
- "step": 35
108
- },
109
- {
110
- "epoch": 4.0,
111
- "grad_norm": 7.014026165008545,
112
- "learning_rate": 1.8421052631578947e-05,
113
- "loss": 0.1901,
114
- "step": 40
115
- },
116
- {
117
- "epoch": 4.0,
118
- "eval_accuracy": 0.8846153846153846,
119
- "eval_f1": 0.8828402366863904,
120
- "eval_f1_class_0": 0.9010989010989011,
121
- "eval_f1_class_1": 0.8615384615384616,
122
- "eval_loss": 0.3602108657360077,
123
- "eval_precision": 0.8961727927245169,
124
- "eval_precision_class_0": 0.8367346938775511,
125
- "eval_precision_class_1": 0.9655172413793104,
126
- "eval_recall": 0.8846153846153846,
127
- "eval_runtime": 0.6999,
128
- "eval_samples_per_second": 111.445,
129
- "eval_steps_per_second": 2.858,
130
- "step": 40
131
- },
132
- {
133
- "epoch": 4.5,
134
- "grad_norm": 1.7869679927825928,
135
- "learning_rate": 1.4035087719298246e-05,
136
- "loss": 0.1756,
137
- "step": 45
138
- },
139
- {
140
- "epoch": 5.0,
141
- "grad_norm": 1.1429275274276733,
142
- "learning_rate": 9.649122807017545e-06,
143
- "loss": 0.0941,
144
- "step": 50
145
- },
146
- {
147
- "epoch": 5.0,
148
- "eval_accuracy": 0.9230769230769231,
149
- "eval_f1": 0.9228724763608483,
150
- "eval_f1_class_0": 0.9302325581395349,
151
- "eval_f1_class_1": 0.9142857142857143,
152
- "eval_loss": 0.19413678348064423,
153
- "eval_precision": 0.9238996297819827,
154
- "eval_precision_class_0": 0.9090909090909091,
155
- "eval_precision_class_1": 0.9411764705882353,
156
- "eval_recall": 0.9230769230769231,
157
- "eval_runtime": 0.6829,
158
- "eval_samples_per_second": 114.219,
159
- "eval_steps_per_second": 2.929,
160
- "step": 50
161
- }
162
- ],
163
- "logging_steps": 5,
164
- "max_steps": 60,
165
- "num_input_tokens_seen": 0,
166
- "num_train_epochs": 6,
167
- "save_steps": 500,
168
- "stateful_callbacks": {
169
- "EarlyStoppingCallback": {
170
- "args": {
171
- "early_stopping_patience": 2,
172
- "early_stopping_threshold": 0.0
173
- },
174
- "attributes": {
175
- "early_stopping_patience_counter": 0
176
- }
177
- },
178
- "TrainerControl": {
179
- "args": {
180
- "should_epoch_stop": false,
181
- "should_evaluate": false,
182
- "should_log": false,
183
- "should_save": true,
184
- "should_training_stop": false
185
- },
186
- "attributes": {}
187
- }
188
- },
189
- "total_flos": 51165532730880.0,
190
- "train_batch_size": 32,
191
- "trial_name": null,
192
- "trial_params": null
193
- }