AnnyNguyen commited on
Commit
40c9390
·
verified ·
1 Parent(s): 845ec66

Delete checkpoint-1566/trainer_state.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. checkpoint-1566/trainer_state.json +0 -196
checkpoint-1566/trainer_state.json DELETED
@@ -1,196 +0,0 @@
1
- {
2
- "best_global_step": 1566,
3
- "best_metric": 0.5676447814653858,
4
- "best_model_checkpoint": "outputs/bartpho/checkpoint-1566",
5
- "epoch": 9.0,
6
- "eval_steps": 500,
7
- "global_step": 1566,
8
- "is_hyper_param_search": false,
9
- "is_local_process_zero": true,
10
- "is_world_process_zero": true,
11
- "log_history": [
12
- {
13
- "epoch": 0.9942528735632183,
14
- "grad_norm": 8.253643035888672,
15
- "learning_rate": 6.88e-06,
16
- "loss": 1.7722,
17
- "step": 173
18
- },
19
- {
20
- "epoch": 1.0,
21
- "eval_accuracy": 0.35422740524781343,
22
- "eval_loss": 1.6894474029541016,
23
- "eval_macro_f1": 0.16483983747511713,
24
- "eval_runtime": 4.6188,
25
- "eval_samples_per_second": 148.524,
26
- "eval_steps_per_second": 4.763,
27
- "step": 174
28
- },
29
- {
30
- "epoch": 1.9885057471264367,
31
- "grad_norm": 10.314130783081055,
32
- "learning_rate": 1.38e-05,
33
- "loss": 1.5474,
34
- "step": 346
35
- },
36
- {
37
- "epoch": 2.0,
38
- "eval_accuracy": 0.49416909620991256,
39
- "eval_loss": 1.3798141479492188,
40
- "eval_macro_f1": 0.33564178199668815,
41
- "eval_runtime": 4.6167,
42
- "eval_samples_per_second": 148.592,
43
- "eval_steps_per_second": 4.765,
44
- "step": 348
45
- },
46
- {
47
- "epoch": 2.9827586206896552,
48
- "grad_norm": 11.580602645874023,
49
- "learning_rate": 1.999994401896218e-05,
50
- "loss": 1.3036,
51
- "step": 519
52
- },
53
- {
54
- "epoch": 3.0,
55
- "eval_accuracy": 0.5728862973760933,
56
- "eval_loss": 1.1752054691314697,
57
- "eval_macro_f1": 0.4355327116696494,
58
- "eval_runtime": 4.6311,
59
- "eval_samples_per_second": 148.13,
60
- "eval_steps_per_second": 4.751,
61
- "step": 522
62
- },
63
- {
64
- "epoch": 3.9770114942528734,
65
- "grad_norm": 14.440051078796387,
66
- "learning_rate": 1.9993697433304146e-05,
67
- "loss": 1.1727,
68
- "step": 692
69
- },
70
- {
71
- "epoch": 4.0,
72
- "eval_accuracy": 0.5787172011661808,
73
- "eval_loss": 1.1525901556015015,
74
- "eval_macro_f1": 0.4912122989755165,
75
- "eval_runtime": 4.6769,
76
- "eval_samples_per_second": 146.679,
77
- "eval_steps_per_second": 4.704,
78
- "step": 696
79
- },
80
- {
81
- "epoch": 4.971264367816092,
82
- "grad_norm": 13.43419361114502,
83
- "learning_rate": 1.9977115923137912e-05,
84
- "loss": 1.0254,
85
- "step": 865
86
- },
87
- {
88
- "epoch": 5.0,
89
- "eval_accuracy": 0.5932944606413995,
90
- "eval_loss": 1.1551982164382935,
91
- "eval_macro_f1": 0.5047627462427012,
92
- "eval_runtime": 4.7431,
93
- "eval_samples_per_second": 144.632,
94
- "eval_steps_per_second": 4.638,
95
- "step": 870
96
- },
97
- {
98
- "epoch": 5.9655172413793105,
99
- "grad_norm": 13.305834770202637,
100
- "learning_rate": 1.995021663613649e-05,
101
- "loss": 0.8855,
102
- "step": 1038
103
- },
104
- {
105
- "epoch": 6.0,
106
- "eval_accuracy": 0.5860058309037901,
107
- "eval_loss": 1.0997425317764282,
108
- "eval_macro_f1": 0.5274407663166836,
109
- "eval_runtime": 4.6958,
110
- "eval_samples_per_second": 146.087,
111
- "eval_steps_per_second": 4.685,
112
- "step": 1044
113
- },
114
- {
115
- "epoch": 6.959770114942529,
116
- "grad_norm": 11.853787422180176,
117
- "learning_rate": 1.991302739004225e-05,
118
- "loss": 0.7547,
119
- "step": 1211
120
- },
121
- {
122
- "epoch": 7.0,
123
- "eval_accuracy": 0.5816326530612245,
124
- "eval_loss": 1.2447866201400757,
125
- "eval_macro_f1": 0.5071616053303554,
126
- "eval_runtime": 4.6271,
127
- "eval_samples_per_second": 148.256,
128
- "eval_steps_per_second": 4.755,
129
- "step": 1218
130
- },
131
- {
132
- "epoch": 7.954022988505747,
133
- "grad_norm": 13.94935417175293,
134
- "learning_rate": 1.9865586643899352e-05,
135
- "loss": 0.6322,
136
- "step": 1384
137
- },
138
- {
139
- "epoch": 8.0,
140
- "eval_accuracy": 0.575801749271137,
141
- "eval_loss": 1.263814091682434,
142
- "eval_macro_f1": 0.5216417103369302,
143
- "eval_runtime": 4.6197,
144
- "eval_samples_per_second": 148.494,
145
- "eval_steps_per_second": 4.762,
146
- "step": 1392
147
- },
148
- {
149
- "epoch": 8.948275862068966,
150
- "grad_norm": 13.111533164978027,
151
- "learning_rate": 1.9807943458281543e-05,
152
- "loss": 0.4984,
153
- "step": 1557
154
- },
155
- {
156
- "epoch": 9.0,
157
- "eval_accuracy": 0.6020408163265306,
158
- "eval_loss": 1.3265769481658936,
159
- "eval_macro_f1": 0.5676447814653858,
160
- "eval_runtime": 4.6357,
161
- "eval_samples_per_second": 147.98,
162
- "eval_steps_per_second": 4.746,
163
- "step": 1566
164
- }
165
- ],
166
- "logging_steps": 173,
167
- "max_steps": 17400,
168
- "num_input_tokens_seen": 0,
169
- "num_train_epochs": 100,
170
- "save_steps": 500,
171
- "stateful_callbacks": {
172
- "EarlyStoppingCallback": {
173
- "args": {
174
- "early_stopping_patience": 5,
175
- "early_stopping_threshold": 0.0
176
- },
177
- "attributes": {
178
- "early_stopping_patience_counter": 0
179
- }
180
- },
181
- "TrainerControl": {
182
- "args": {
183
- "should_epoch_stop": false,
184
- "should_evaluate": false,
185
- "should_log": false,
186
- "should_save": true,
187
- "should_training_stop": false
188
- },
189
- "attributes": {}
190
- }
191
- },
192
- "total_flos": 2.0879945994205656e+16,
193
- "train_batch_size": 32,
194
- "trial_name": null,
195
- "trial_params": null
196
- }