koke143 commited on
Commit
2191f4b
·
verified ·
1 Parent(s): b3dbba4

Delete trainer_state.json

Browse files
Files changed (1) hide show
  1. trainer_state.json +0 -177
trainer_state.json DELETED
@@ -1,177 +0,0 @@
1
- {
2
- "best_metric": 0.31034482758620696,
3
- "best_model_checkpoint": "./models/checkpoint/checkpoint-68",
4
- "epoch": 9.275862068965518,
5
- "eval_steps": 500,
6
- "global_step": 80,
7
- "is_hyper_param_search": false,
8
- "is_local_process_zero": true,
9
- "is_world_process_zero": true,
10
- "log_history": [
11
- {
12
- "epoch": 0.9195402298850575,
13
- "eval_f1": 0.2727272727272727,
14
- "eval_loss": 9.31263256072998,
15
- "eval_runtime": 0.1958,
16
- "eval_samples_per_second": 51.067,
17
- "eval_steps_per_second": 25.534,
18
- "step": 8
19
- },
20
- {
21
- "epoch": 0.9195402298850575,
22
- "step": 8,
23
- "total_flos": 20939936811486.0,
24
- "train_loss": 9.918171882629395,
25
- "train_runtime": 21.4307,
26
- "train_samples_per_second": 4.06,
27
- "train_steps_per_second": 0.373
28
- },
29
- {
30
- "epoch": 0.9195402298850575,
31
- "step": 8,
32
- "total_flos": 20939936811486.0,
33
- "train_loss": 0.0,
34
- "train_runtime": 0.5294,
35
- "train_samples_per_second": 164.352,
36
- "train_steps_per_second": 15.113
37
- },
38
- {
39
- "epoch": 1.9195402298850575,
40
- "eval_f1": 0.2530120481927711,
41
- "eval_loss": 9.20499038696289,
42
- "eval_runtime": 0.1794,
43
- "eval_samples_per_second": 55.739,
44
- "eval_steps_per_second": 27.87,
45
- "step": 16
46
- },
47
- {
48
- "epoch": 2.954022988505747,
49
- "eval_f1": 0.25842696629213485,
50
- "eval_loss": 8.635601997375488,
51
- "eval_runtime": 0.1743,
52
- "eval_samples_per_second": 57.382,
53
- "eval_steps_per_second": 28.691,
54
- "step": 25
55
- },
56
- {
57
- "epoch": 3.9885057471264367,
58
- "eval_f1": 0.30409356725146197,
59
- "eval_loss": 8.560417175292969,
60
- "eval_runtime": 0.1737,
61
- "eval_samples_per_second": 57.572,
62
- "eval_steps_per_second": 28.786,
63
- "step": 34
64
- },
65
- {
66
- "epoch": 4.908045977011494,
67
- "eval_f1": 0.3076923076923077,
68
- "eval_loss": 8.47392463684082,
69
- "eval_runtime": 0.1856,
70
- "eval_samples_per_second": 53.876,
71
- "eval_steps_per_second": 26.938,
72
- "step": 42
73
- },
74
- {
75
- "epoch": 5.942528735632184,
76
- "eval_f1": 0.30857142857142855,
77
- "eval_loss": 8.22740364074707,
78
- "eval_runtime": 0.1773,
79
- "eval_samples_per_second": 56.411,
80
- "eval_steps_per_second": 28.205,
81
- "step": 51
82
- },
83
- {
84
- "epoch": 6.977011494252873,
85
- "eval_f1": 0.3,
86
- "eval_loss": 8.102139472961426,
87
- "eval_runtime": 0.1819,
88
- "eval_samples_per_second": 54.979,
89
- "eval_steps_per_second": 27.49,
90
- "step": 60
91
- },
92
- {
93
- "epoch": 7.896551724137931,
94
- "eval_f1": 0.31034482758620696,
95
- "eval_loss": 7.982325553894043,
96
- "eval_runtime": 0.1721,
97
- "eval_samples_per_second": 58.115,
98
- "eval_steps_per_second": 29.057,
99
- "step": 68
100
- },
101
- {
102
- "epoch": 8.931034482758621,
103
- "eval_f1": 0.30681818181818177,
104
- "eval_loss": 7.987342834472656,
105
- "eval_runtime": 0.1737,
106
- "eval_samples_per_second": 57.583,
107
- "eval_steps_per_second": 28.792,
108
- "step": 77
109
- },
110
- {
111
- "epoch": 9.275862068965518,
112
- "eval_f1": 0.30681818181818177,
113
- "eval_loss": 7.902113437652588,
114
- "eval_runtime": 0.1822,
115
- "eval_samples_per_second": 54.889,
116
- "eval_steps_per_second": 27.444,
117
- "step": 80
118
- },
119
- {
120
- "epoch": 9.275862068965518,
121
- "step": 80,
122
- "total_flos": 202609940734866.0,
123
- "train_loss": 7.418544769287109,
124
- "train_runtime": 132.4614,
125
- "train_samples_per_second": 6.568,
126
- "train_steps_per_second": 0.604
127
- },
128
- {
129
- "epoch": 9.275862068965518,
130
- "step": 80,
131
- "total_flos": 202609940734866.0,
132
- "train_loss": 0.0,
133
- "train_runtime": 0.245,
134
- "train_samples_per_second": 355.061,
135
- "train_steps_per_second": 32.649
136
- },
137
- {
138
- "epoch": 9.275862068965518,
139
- "step": 80,
140
- "total_flos": 202609940734866.0,
141
- "train_loss": 0.0,
142
- "train_runtime": 0.244,
143
- "train_samples_per_second": 356.519,
144
- "train_steps_per_second": 32.783
145
- }
146
- ],
147
- "logging_steps": 500,
148
- "max_steps": 8,
149
- "num_input_tokens_seen": 0,
150
- "num_train_epochs": 1,
151
- "save_steps": 500,
152
- "stateful_callbacks": {
153
- "EarlyStoppingCallback": {
154
- "args": {
155
- "early_stopping_patience": 3,
156
- "early_stopping_threshold": 0.0
157
- },
158
- "attributes": {
159
- "early_stopping_patience_counter": 0
160
- }
161
- },
162
- "TrainerControl": {
163
- "args": {
164
- "should_epoch_stop": false,
165
- "should_evaluate": false,
166
- "should_log": false,
167
- "should_save": true,
168
- "should_training_stop": true
169
- },
170
- "attributes": {}
171
- }
172
- },
173
- "total_flos": 202609940734866.0,
174
- "train_batch_size": 1,
175
- "trial_name": null,
176
- "trial_params": null
177
- }