RobertoSonic committed on
Commit
667d004
·
verified ·
1 Parent(s): b812877

End of training

Browse files
README.md CHANGED
@@ -18,7 +18,7 @@ should probably proofread and complete it, then remove this comment. -->
18
 
19
  This model is a fine-tuned version of [microsoft/swinv2-tiny-patch4-window8-256](https://huggingface.co/microsoft/swinv2-tiny-patch4-window8-256) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
- - Loss: 1.8446
22
  - Accuracy: 0.6538
23
 
24
  ## Model description
 
18
 
19
  This model is a fine-tuned version of [microsoft/swinv2-tiny-patch4-window8-256](https://huggingface.co/microsoft/swinv2-tiny-patch4-window8-256) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
+ - Loss: 1.8351
22
  - Accuracy: 0.6538
23
 
24
  ## Model description
all_results.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 29.8,
3
+ "eval_accuracy": 0.6538461538461539,
4
+ "eval_loss": 1.8350580930709839,
5
+ "eval_runtime": 1.9929,
6
+ "eval_samples_per_second": 52.185,
7
+ "eval_steps_per_second": 2.007,
8
+ "total_flos": 3.1009435460901274e+17,
9
+ "train_loss": 1.446416116754214,
10
+ "train_runtime": 581.9968,
11
+ "train_samples_per_second": 23.969,
12
+ "train_steps_per_second": 0.155
13
+ }
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 29.8,
3
+ "eval_accuracy": 0.6538461538461539,
4
+ "eval_loss": 1.8350580930709839,
5
+ "eval_runtime": 1.9929,
6
+ "eval_samples_per_second": 52.185,
7
+ "eval_steps_per_second": 2.007
8
+ }
runs/Feb04_02-12-51_ad369e174003/events.out.tfevents.1738635783.ad369e174003.1285.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:567b4445b1a44260c1690f7432567aa3e315bb64f583e24ed18c83b0e741e5a5
3
+ size 405
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 29.8,
3
+ "total_flos": 3.1009435460901274e+17,
4
+ "train_loss": 1.446416116754214,
5
+ "train_runtime": 581.9968,
6
+ "train_samples_per_second": 23.969,
7
+ "train_steps_per_second": 0.155
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,361 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.6538461538461539,
3
+ "best_model_checkpoint": "swinv2-tiny-patch4-window8-256-dmae-humeda-DAV37/checkpoint-54",
4
+ "epoch": 29.8,
5
+ "eval_steps": 500,
6
+ "global_step": 90,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.8,
13
+ "eval_accuracy": 0.1346153846153846,
14
+ "eval_loss": 1.6284154653549194,
15
+ "eval_runtime": 1.4528,
16
+ "eval_samples_per_second": 71.585,
17
+ "eval_steps_per_second": 2.753,
18
+ "step": 3
19
+ },
20
+ {
21
+ "epoch": 1.8,
22
+ "eval_accuracy": 0.2403846153846154,
23
+ "eval_loss": 1.5965616703033447,
24
+ "eval_runtime": 1.4255,
25
+ "eval_samples_per_second": 72.959,
26
+ "eval_steps_per_second": 2.806,
27
+ "step": 6
28
+ },
29
+ {
30
+ "epoch": 2.8,
31
+ "eval_accuracy": 0.3942307692307692,
32
+ "eval_loss": 1.5076172351837158,
33
+ "eval_runtime": 1.9058,
34
+ "eval_samples_per_second": 54.57,
35
+ "eval_steps_per_second": 2.099,
36
+ "step": 9
37
+ },
38
+ {
39
+ "epoch": 3.8,
40
+ "grad_norm": 30.521873474121094,
41
+ "learning_rate": 4.983095894354858e-05,
42
+ "loss": 6.28,
43
+ "step": 12
44
+ },
45
+ {
46
+ "epoch": 3.8,
47
+ "eval_accuracy": 0.46153846153846156,
48
+ "eval_loss": 1.2911909818649292,
49
+ "eval_runtime": 1.4733,
50
+ "eval_samples_per_second": 70.589,
51
+ "eval_steps_per_second": 2.715,
52
+ "step": 12
53
+ },
54
+ {
55
+ "epoch": 4.8,
56
+ "eval_accuracy": 0.5096153846153846,
57
+ "eval_loss": 1.2136619091033936,
58
+ "eval_runtime": 1.4295,
59
+ "eval_samples_per_second": 72.754,
60
+ "eval_steps_per_second": 2.798,
61
+ "step": 15
62
+ },
63
+ {
64
+ "epoch": 5.8,
65
+ "eval_accuracy": 0.5384615384615384,
66
+ "eval_loss": 1.1916911602020264,
67
+ "eval_runtime": 1.4167,
68
+ "eval_samples_per_second": 73.411,
69
+ "eval_steps_per_second": 2.823,
70
+ "step": 18
71
+ },
72
+ {
73
+ "epoch": 6.8,
74
+ "eval_accuracy": 0.5673076923076923,
75
+ "eval_loss": 1.1497925519943237,
76
+ "eval_runtime": 1.4207,
77
+ "eval_samples_per_second": 73.205,
78
+ "eval_steps_per_second": 2.816,
79
+ "step": 21
80
+ },
81
+ {
82
+ "epoch": 7.8,
83
+ "grad_norm": 21.03725814819336,
84
+ "learning_rate": 4.588719528532342e-05,
85
+ "loss": 2.9539,
86
+ "step": 24
87
+ },
88
+ {
89
+ "epoch": 7.8,
90
+ "eval_accuracy": 0.5865384615384616,
91
+ "eval_loss": 1.202553629875183,
92
+ "eval_runtime": 1.8718,
93
+ "eval_samples_per_second": 55.562,
94
+ "eval_steps_per_second": 2.137,
95
+ "step": 24
96
+ },
97
+ {
98
+ "epoch": 8.8,
99
+ "eval_accuracy": 0.5961538461538461,
100
+ "eval_loss": 1.2710736989974976,
101
+ "eval_runtime": 1.845,
102
+ "eval_samples_per_second": 56.369,
103
+ "eval_steps_per_second": 2.168,
104
+ "step": 27
105
+ },
106
+ {
107
+ "epoch": 9.8,
108
+ "eval_accuracy": 0.625,
109
+ "eval_loss": 1.3533679246902466,
110
+ "eval_runtime": 1.412,
111
+ "eval_samples_per_second": 73.654,
112
+ "eval_steps_per_second": 2.833,
113
+ "step": 30
114
+ },
115
+ {
116
+ "epoch": 10.8,
117
+ "eval_accuracy": 0.625,
118
+ "eval_loss": 1.3210114240646362,
119
+ "eval_runtime": 1.4139,
120
+ "eval_samples_per_second": 73.555,
121
+ "eval_steps_per_second": 2.829,
122
+ "step": 33
123
+ },
124
+ {
125
+ "epoch": 11.8,
126
+ "grad_norm": 31.268625259399414,
127
+ "learning_rate": 3.7500000000000003e-05,
128
+ "loss": 0.9643,
129
+ "step": 36
130
+ },
131
+ {
132
+ "epoch": 11.8,
133
+ "eval_accuracy": 0.6346153846153846,
134
+ "eval_loss": 1.394026279449463,
135
+ "eval_runtime": 1.4476,
136
+ "eval_samples_per_second": 71.841,
137
+ "eval_steps_per_second": 2.763,
138
+ "step": 36
139
+ },
140
+ {
141
+ "epoch": 12.8,
142
+ "eval_accuracy": 0.6346153846153846,
143
+ "eval_loss": 1.4859095811843872,
144
+ "eval_runtime": 1.9438,
145
+ "eval_samples_per_second": 53.502,
146
+ "eval_steps_per_second": 2.058,
147
+ "step": 39
148
+ },
149
+ {
150
+ "epoch": 13.8,
151
+ "eval_accuracy": 0.6346153846153846,
152
+ "eval_loss": 1.4965322017669678,
153
+ "eval_runtime": 1.4426,
154
+ "eval_samples_per_second": 72.093,
155
+ "eval_steps_per_second": 2.773,
156
+ "step": 42
157
+ },
158
+ {
159
+ "epoch": 14.8,
160
+ "eval_accuracy": 0.625,
161
+ "eval_loss": 1.5463168621063232,
162
+ "eval_runtime": 1.4453,
163
+ "eval_samples_per_second": 71.956,
164
+ "eval_steps_per_second": 2.768,
165
+ "step": 45
166
+ },
167
+ {
168
+ "epoch": 15.8,
169
+ "grad_norm": 22.09276008605957,
170
+ "learning_rate": 2.6453620722761896e-05,
171
+ "loss": 0.3275,
172
+ "step": 48
173
+ },
174
+ {
175
+ "epoch": 15.8,
176
+ "eval_accuracy": 0.6346153846153846,
177
+ "eval_loss": 1.5884944200515747,
178
+ "eval_runtime": 1.5085,
179
+ "eval_samples_per_second": 68.944,
180
+ "eval_steps_per_second": 2.652,
181
+ "step": 48
182
+ },
183
+ {
184
+ "epoch": 16.8,
185
+ "eval_accuracy": 0.6442307692307693,
186
+ "eval_loss": 1.6466037034988403,
187
+ "eval_runtime": 1.9209,
188
+ "eval_samples_per_second": 54.142,
189
+ "eval_steps_per_second": 2.082,
190
+ "step": 51
191
+ },
192
+ {
193
+ "epoch": 17.8,
194
+ "eval_accuracy": 0.6538461538461539,
195
+ "eval_loss": 1.8350580930709839,
196
+ "eval_runtime": 1.4271,
197
+ "eval_samples_per_second": 72.873,
198
+ "eval_steps_per_second": 2.803,
199
+ "step": 54
200
+ },
201
+ {
202
+ "epoch": 18.8,
203
+ "eval_accuracy": 0.6442307692307693,
204
+ "eval_loss": 1.8326284885406494,
205
+ "eval_runtime": 1.4279,
206
+ "eval_samples_per_second": 72.832,
207
+ "eval_steps_per_second": 2.801,
208
+ "step": 57
209
+ },
210
+ {
211
+ "epoch": 19.8,
212
+ "grad_norm": 31.147811889648438,
213
+ "learning_rate": 1.509800584902108e-05,
214
+ "loss": 0.1501,
215
+ "step": 60
216
+ },
217
+ {
218
+ "epoch": 19.8,
219
+ "eval_accuracy": 0.6346153846153846,
220
+ "eval_loss": 1.7521249055862427,
221
+ "eval_runtime": 1.4343,
222
+ "eval_samples_per_second": 72.507,
223
+ "eval_steps_per_second": 2.789,
224
+ "step": 60
225
+ },
226
+ {
227
+ "epoch": 20.8,
228
+ "eval_accuracy": 0.6538461538461539,
229
+ "eval_loss": 1.780649185180664,
230
+ "eval_runtime": 1.8229,
231
+ "eval_samples_per_second": 57.051,
232
+ "eval_steps_per_second": 2.194,
233
+ "step": 63
234
+ },
235
+ {
236
+ "epoch": 21.8,
237
+ "eval_accuracy": 0.6538461538461539,
238
+ "eval_loss": 1.766915202140808,
239
+ "eval_runtime": 1.7174,
240
+ "eval_samples_per_second": 60.557,
241
+ "eval_steps_per_second": 2.329,
242
+ "step": 66
243
+ },
244
+ {
245
+ "epoch": 22.8,
246
+ "eval_accuracy": 0.6346153846153846,
247
+ "eval_loss": 1.8873956203460693,
248
+ "eval_runtime": 1.4404,
249
+ "eval_samples_per_second": 72.202,
250
+ "eval_steps_per_second": 2.777,
251
+ "step": 69
252
+ },
253
+ {
254
+ "epoch": 23.8,
255
+ "grad_norm": 9.280792236328125,
256
+ "learning_rate": 5.848888922025553e-06,
257
+ "loss": 0.09,
258
+ "step": 72
259
+ },
260
+ {
261
+ "epoch": 23.8,
262
+ "eval_accuracy": 0.6538461538461539,
263
+ "eval_loss": 1.8826991319656372,
264
+ "eval_runtime": 1.431,
265
+ "eval_samples_per_second": 72.678,
266
+ "eval_steps_per_second": 2.795,
267
+ "step": 72
268
+ },
269
+ {
270
+ "epoch": 24.8,
271
+ "eval_accuracy": 0.6538461538461539,
272
+ "eval_loss": 1.8329722881317139,
273
+ "eval_runtime": 1.9352,
274
+ "eval_samples_per_second": 53.742,
275
+ "eval_steps_per_second": 2.067,
276
+ "step": 75
277
+ },
278
+ {
279
+ "epoch": 25.8,
280
+ "eval_accuracy": 0.6538461538461539,
281
+ "eval_loss": 1.8330668210983276,
282
+ "eval_runtime": 1.5124,
283
+ "eval_samples_per_second": 68.765,
284
+ "eval_steps_per_second": 2.645,
285
+ "step": 78
286
+ },
287
+ {
288
+ "epoch": 26.8,
289
+ "eval_accuracy": 0.6538461538461539,
290
+ "eval_loss": 1.841007947921753,
291
+ "eval_runtime": 1.438,
292
+ "eval_samples_per_second": 72.324,
293
+ "eval_steps_per_second": 2.782,
294
+ "step": 81
295
+ },
296
+ {
297
+ "epoch": 27.8,
298
+ "grad_norm": 13.664288520812988,
299
+ "learning_rate": 6.738782355044049e-07,
300
+ "loss": 0.0595,
301
+ "step": 84
302
+ },
303
+ {
304
+ "epoch": 27.8,
305
+ "eval_accuracy": 0.6442307692307693,
306
+ "eval_loss": 1.8440735340118408,
307
+ "eval_runtime": 1.4316,
308
+ "eval_samples_per_second": 72.647,
309
+ "eval_steps_per_second": 2.794,
310
+ "step": 84
311
+ },
312
+ {
313
+ "epoch": 28.8,
314
+ "eval_accuracy": 0.6538461538461539,
315
+ "eval_loss": 1.8444327116012573,
316
+ "eval_runtime": 1.7905,
317
+ "eval_samples_per_second": 58.086,
318
+ "eval_steps_per_second": 2.234,
319
+ "step": 87
320
+ },
321
+ {
322
+ "epoch": 29.8,
323
+ "eval_accuracy": 0.6538461538461539,
324
+ "eval_loss": 1.844649076461792,
325
+ "eval_runtime": 1.7539,
326
+ "eval_samples_per_second": 59.298,
327
+ "eval_steps_per_second": 2.281,
328
+ "step": 90
329
+ },
330
+ {
331
+ "epoch": 29.8,
332
+ "step": 90,
333
+ "total_flos": 3.1009435460901274e+17,
334
+ "train_loss": 1.446416116754214,
335
+ "train_runtime": 581.9968,
336
+ "train_samples_per_second": 23.969,
337
+ "train_steps_per_second": 0.155
338
+ }
339
+ ],
340
+ "logging_steps": 12,
341
+ "max_steps": 90,
342
+ "num_input_tokens_seen": 0,
343
+ "num_train_epochs": 30,
344
+ "save_steps": 500,
345
+ "stateful_callbacks": {
346
+ "TrainerControl": {
347
+ "args": {
348
+ "should_epoch_stop": false,
349
+ "should_evaluate": false,
350
+ "should_log": false,
351
+ "should_save": true,
352
+ "should_training_stop": true
353
+ },
354
+ "attributes": {}
355
+ }
356
+ },
357
+ "total_flos": 3.1009435460901274e+17,
358
+ "train_batch_size": 32,
359
+ "trial_name": null,
360
+ "trial_params": null
361
+ }