RobertoSonic committed on
Commit
f8d09b7
·
verified ·
1 Parent(s): 97b236b

End of training

Browse files
README.md CHANGED
@@ -18,7 +18,7 @@ should probably proofread and complete it, then remove this comment. -->
18
 
19
  This model is a fine-tuned version of [microsoft/swinv2-tiny-patch4-window8-256](https://huggingface.co/microsoft/swinv2-tiny-patch4-window8-256) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
- - Loss: 1.2547
22
  - Accuracy: 0.5192
23
 
24
  ## Model description
 
18
 
19
  This model is a fine-tuned version of [microsoft/swinv2-tiny-patch4-window8-256](https://huggingface.co/microsoft/swinv2-tiny-patch4-window8-256) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
+ - Loss: 1.2286
22
  - Accuracy: 0.5192
23
 
24
  ## Model description
all_results.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 30.0,
3
+ "eval_accuracy": 0.5192307692307693,
4
+ "eval_loss": 1.2286193370819092,
5
+ "eval_runtime": 0.9797,
6
+ "eval_samples_per_second": 53.078,
7
+ "eval_steps_per_second": 2.041,
8
+ "total_flos": 7.115852825454182e+17,
9
+ "train_loss": 3.1241997612847223,
10
+ "train_runtime": 594.7221,
11
+ "train_samples_per_second": 36.773,
12
+ "train_steps_per_second": 0.151
13
+ }
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 30.0,
3
+ "eval_accuracy": 0.5192307692307693,
4
+ "eval_loss": 1.2286193370819092,
5
+ "eval_runtime": 0.9797,
6
+ "eval_samples_per_second": 53.078,
7
+ "eval_steps_per_second": 2.041
8
+ }
runs/Jan20_18-12-26_2dbac0f7b711/events.out.tfevents.1737397395.2dbac0f7b711.1282.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c0836714fb25cbbf1c347312f26e530d48a5240d6b19d82199a73312e0c0ecaa
3
+ size 405
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 30.0,
3
+ "total_flos": 7.115852825454182e+17,
4
+ "train_loss": 3.1241997612847223,
5
+ "train_runtime": 594.7221,
6
+ "train_samples_per_second": 36.773,
7
+ "train_steps_per_second": 0.151
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,375 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.5192307692307693,
3
+ "best_model_checkpoint": "swinv2-tiny-patch4-window8-256-dmae-humeda-DAV9/checkpoint-63",
4
+ "epoch": 30.0,
5
+ "eval_steps": 500,
6
+ "global_step": 90,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 1.0,
13
+ "eval_accuracy": 0.23076923076923078,
14
+ "eval_loss": 1.5944099426269531,
15
+ "eval_runtime": 0.986,
16
+ "eval_samples_per_second": 52.74,
17
+ "eval_steps_per_second": 2.028,
18
+ "step": 3
19
+ },
20
+ {
21
+ "epoch": 2.0,
22
+ "eval_accuracy": 0.2692307692307692,
23
+ "eval_loss": 1.5511040687561035,
24
+ "eval_runtime": 0.9229,
25
+ "eval_samples_per_second": 56.344,
26
+ "eval_steps_per_second": 2.167,
27
+ "step": 6
28
+ },
29
+ {
30
+ "epoch": 3.0,
31
+ "eval_accuracy": 0.34615384615384615,
32
+ "eval_loss": 1.491486668586731,
33
+ "eval_runtime": 1.2511,
34
+ "eval_samples_per_second": 41.564,
35
+ "eval_steps_per_second": 1.599,
36
+ "step": 9
37
+ },
38
+ {
39
+ "epoch": 3.3333333333333335,
40
+ "grad_norm": 9.355170249938965,
41
+ "learning_rate": 1.6666666666666667e-05,
42
+ "loss": 6.2974,
43
+ "step": 10
44
+ },
45
+ {
46
+ "epoch": 4.0,
47
+ "eval_accuracy": 0.46153846153846156,
48
+ "eval_loss": 1.4388242959976196,
49
+ "eval_runtime": 0.9203,
50
+ "eval_samples_per_second": 56.504,
51
+ "eval_steps_per_second": 2.173,
52
+ "step": 12
53
+ },
54
+ {
55
+ "epoch": 5.0,
56
+ "eval_accuracy": 0.46153846153846156,
57
+ "eval_loss": 1.3927408456802368,
58
+ "eval_runtime": 0.9499,
59
+ "eval_samples_per_second": 54.741,
60
+ "eval_steps_per_second": 2.105,
61
+ "step": 15
62
+ },
63
+ {
64
+ "epoch": 6.0,
65
+ "eval_accuracy": 0.4423076923076923,
66
+ "eval_loss": 1.3393510580062866,
67
+ "eval_runtime": 0.9523,
68
+ "eval_samples_per_second": 54.605,
69
+ "eval_steps_per_second": 2.1,
70
+ "step": 18
71
+ },
72
+ {
73
+ "epoch": 6.666666666666667,
74
+ "grad_norm": 14.36314582824707,
75
+ "learning_rate": 2.9942920471376185e-05,
76
+ "loss": 5.3611,
77
+ "step": 20
78
+ },
79
+ {
80
+ "epoch": 7.0,
81
+ "eval_accuracy": 0.4423076923076923,
82
+ "eval_loss": 1.3107666969299316,
83
+ "eval_runtime": 0.9443,
84
+ "eval_samples_per_second": 55.069,
85
+ "eval_steps_per_second": 2.118,
86
+ "step": 21
87
+ },
88
+ {
89
+ "epoch": 8.0,
90
+ "eval_accuracy": 0.34615384615384615,
91
+ "eval_loss": 1.3680166006088257,
92
+ "eval_runtime": 1.2909,
93
+ "eval_samples_per_second": 40.281,
94
+ "eval_steps_per_second": 1.549,
95
+ "step": 24
96
+ },
97
+ {
98
+ "epoch": 9.0,
99
+ "eval_accuracy": 0.40384615384615385,
100
+ "eval_loss": 1.2717851400375366,
101
+ "eval_runtime": 0.9305,
102
+ "eval_samples_per_second": 55.883,
103
+ "eval_steps_per_second": 2.149,
104
+ "step": 27
105
+ },
106
+ {
107
+ "epoch": 10.0,
108
+ "grad_norm": 21.04581642150879,
109
+ "learning_rate": 2.7990381056766583e-05,
110
+ "loss": 3.7205,
111
+ "step": 30
112
+ },
113
+ {
114
+ "epoch": 10.0,
115
+ "eval_accuracy": 0.4230769230769231,
116
+ "eval_loss": 1.2678520679473877,
117
+ "eval_runtime": 0.9355,
118
+ "eval_samples_per_second": 55.588,
119
+ "eval_steps_per_second": 2.138,
120
+ "step": 30
121
+ },
122
+ {
123
+ "epoch": 11.0,
124
+ "eval_accuracy": 0.40384615384615385,
125
+ "eval_loss": 1.3009899854660034,
126
+ "eval_runtime": 0.9418,
127
+ "eval_samples_per_second": 55.212,
128
+ "eval_steps_per_second": 2.124,
129
+ "step": 33
130
+ },
131
+ {
132
+ "epoch": 12.0,
133
+ "eval_accuracy": 0.4230769230769231,
134
+ "eval_loss": 1.2598135471343994,
135
+ "eval_runtime": 0.9337,
136
+ "eval_samples_per_second": 55.694,
137
+ "eval_steps_per_second": 2.142,
138
+ "step": 36
139
+ },
140
+ {
141
+ "epoch": 13.0,
142
+ "eval_accuracy": 0.4230769230769231,
143
+ "eval_loss": 1.2016476392745972,
144
+ "eval_runtime": 0.9331,
145
+ "eval_samples_per_second": 55.726,
146
+ "eval_steps_per_second": 2.143,
147
+ "step": 39
148
+ },
149
+ {
150
+ "epoch": 13.333333333333334,
151
+ "grad_norm": 22.220523834228516,
152
+ "learning_rate": 2.360364654526569e-05,
153
+ "loss": 2.8178,
154
+ "step": 40
155
+ },
156
+ {
157
+ "epoch": 14.0,
158
+ "eval_accuracy": 0.4423076923076923,
159
+ "eval_loss": 1.1934146881103516,
160
+ "eval_runtime": 0.938,
161
+ "eval_samples_per_second": 55.435,
162
+ "eval_steps_per_second": 2.132,
163
+ "step": 42
164
+ },
165
+ {
166
+ "epoch": 15.0,
167
+ "eval_accuracy": 0.4807692307692308,
168
+ "eval_loss": 1.1842211484909058,
169
+ "eval_runtime": 1.3187,
170
+ "eval_samples_per_second": 39.433,
171
+ "eval_steps_per_second": 1.517,
172
+ "step": 45
173
+ },
174
+ {
175
+ "epoch": 16.0,
176
+ "eval_accuracy": 0.5,
177
+ "eval_loss": 1.15390944480896,
178
+ "eval_runtime": 0.9603,
179
+ "eval_samples_per_second": 54.152,
180
+ "eval_steps_per_second": 2.083,
181
+ "step": 48
182
+ },
183
+ {
184
+ "epoch": 16.666666666666668,
185
+ "grad_norm": 24.42645263671875,
186
+ "learning_rate": 1.760472266500396e-05,
187
+ "loss": 2.4001,
188
+ "step": 50
189
+ },
190
+ {
191
+ "epoch": 17.0,
192
+ "eval_accuracy": 0.4807692307692308,
193
+ "eval_loss": 1.1308224201202393,
194
+ "eval_runtime": 0.9273,
195
+ "eval_samples_per_second": 56.077,
196
+ "eval_steps_per_second": 2.157,
197
+ "step": 51
198
+ },
199
+ {
200
+ "epoch": 18.0,
201
+ "eval_accuracy": 0.46153846153846156,
202
+ "eval_loss": 1.217308521270752,
203
+ "eval_runtime": 0.926,
204
+ "eval_samples_per_second": 56.154,
205
+ "eval_steps_per_second": 2.16,
206
+ "step": 54
207
+ },
208
+ {
209
+ "epoch": 19.0,
210
+ "eval_accuracy": 0.5,
211
+ "eval_loss": 1.1669617891311646,
212
+ "eval_runtime": 0.9426,
213
+ "eval_samples_per_second": 55.165,
214
+ "eval_steps_per_second": 2.122,
215
+ "step": 57
216
+ },
217
+ {
218
+ "epoch": 20.0,
219
+ "grad_norm": 23.83008575439453,
220
+ "learning_rate": 1.1117714323462188e-05,
221
+ "loss": 2.081,
222
+ "step": 60
223
+ },
224
+ {
225
+ "epoch": 20.0,
226
+ "eval_accuracy": 0.5,
227
+ "eval_loss": 1.1792218685150146,
228
+ "eval_runtime": 0.9338,
229
+ "eval_samples_per_second": 55.688,
230
+ "eval_steps_per_second": 2.142,
231
+ "step": 60
232
+ },
233
+ {
234
+ "epoch": 21.0,
235
+ "eval_accuracy": 0.5192307692307693,
236
+ "eval_loss": 1.2286193370819092,
237
+ "eval_runtime": 0.9342,
238
+ "eval_samples_per_second": 55.66,
239
+ "eval_steps_per_second": 2.141,
240
+ "step": 63
241
+ },
242
+ {
243
+ "epoch": 22.0,
244
+ "eval_accuracy": 0.5,
245
+ "eval_loss": 1.26326322555542,
246
+ "eval_runtime": 1.1302,
247
+ "eval_samples_per_second": 46.008,
248
+ "eval_steps_per_second": 1.77,
249
+ "step": 66
250
+ },
251
+ {
252
+ "epoch": 23.0,
253
+ "eval_accuracy": 0.5,
254
+ "eval_loss": 1.2379720211029053,
255
+ "eval_runtime": 0.9486,
256
+ "eval_samples_per_second": 54.817,
257
+ "eval_steps_per_second": 2.108,
258
+ "step": 69
259
+ },
260
+ {
261
+ "epoch": 23.333333333333332,
262
+ "grad_norm": 18.731117248535156,
263
+ "learning_rate": 5.3581858547019095e-06,
264
+ "loss": 1.8588,
265
+ "step": 70
266
+ },
267
+ {
268
+ "epoch": 24.0,
269
+ "eval_accuracy": 0.4807692307692308,
270
+ "eval_loss": 1.24978768825531,
271
+ "eval_runtime": 1.2983,
272
+ "eval_samples_per_second": 40.053,
273
+ "eval_steps_per_second": 1.54,
274
+ "step": 72
275
+ },
276
+ {
277
+ "epoch": 25.0,
278
+ "eval_accuracy": 0.5,
279
+ "eval_loss": 1.2591068744659424,
280
+ "eval_runtime": 0.9309,
281
+ "eval_samples_per_second": 55.857,
282
+ "eval_steps_per_second": 2.148,
283
+ "step": 75
284
+ },
285
+ {
286
+ "epoch": 26.0,
287
+ "eval_accuracy": 0.5,
288
+ "eval_loss": 1.2652957439422607,
289
+ "eval_runtime": 0.9419,
290
+ "eval_samples_per_second": 55.21,
291
+ "eval_steps_per_second": 2.123,
292
+ "step": 78
293
+ },
294
+ {
295
+ "epoch": 26.666666666666668,
296
+ "grad_norm": 19.568700790405273,
297
+ "learning_rate": 1.4053831944502509e-06,
298
+ "loss": 1.7634,
299
+ "step": 80
300
+ },
301
+ {
302
+ "epoch": 27.0,
303
+ "eval_accuracy": 0.5,
304
+ "eval_loss": 1.259857177734375,
305
+ "eval_runtime": 0.9424,
306
+ "eval_samples_per_second": 55.178,
307
+ "eval_steps_per_second": 2.122,
308
+ "step": 81
309
+ },
310
+ {
311
+ "epoch": 28.0,
312
+ "eval_accuracy": 0.5,
313
+ "eval_loss": 1.2548739910125732,
314
+ "eval_runtime": 0.9289,
315
+ "eval_samples_per_second": 55.978,
316
+ "eval_steps_per_second": 2.153,
317
+ "step": 84
318
+ },
319
+ {
320
+ "epoch": 29.0,
321
+ "eval_accuracy": 0.5192307692307693,
322
+ "eval_loss": 1.2544516324996948,
323
+ "eval_runtime": 1.0558,
324
+ "eval_samples_per_second": 49.25,
325
+ "eval_steps_per_second": 1.894,
326
+ "step": 87
327
+ },
328
+ {
329
+ "epoch": 30.0,
330
+ "grad_norm": 25.50164222717285,
331
+ "learning_rate": 0.0,
332
+ "loss": 1.8177,
333
+ "step": 90
334
+ },
335
+ {
336
+ "epoch": 30.0,
337
+ "eval_accuracy": 0.5192307692307693,
338
+ "eval_loss": 1.2546559572219849,
339
+ "eval_runtime": 1.2806,
340
+ "eval_samples_per_second": 40.606,
341
+ "eval_steps_per_second": 1.562,
342
+ "step": 90
343
+ },
344
+ {
345
+ "epoch": 30.0,
346
+ "step": 90,
347
+ "total_flos": 7.115852825454182e+17,
348
+ "train_loss": 3.1241997612847223,
349
+ "train_runtime": 594.7221,
350
+ "train_samples_per_second": 36.773,
351
+ "train_steps_per_second": 0.151
352
+ }
353
+ ],
354
+ "logging_steps": 10,
355
+ "max_steps": 90,
356
+ "num_input_tokens_seen": 0,
357
+ "num_train_epochs": 30,
358
+ "save_steps": 500,
359
+ "stateful_callbacks": {
360
+ "TrainerControl": {
361
+ "args": {
362
+ "should_epoch_stop": false,
363
+ "should_evaluate": false,
364
+ "should_log": false,
365
+ "should_save": true,
366
+ "should_training_stop": true
367
+ },
368
+ "attributes": {}
369
+ }
370
+ },
371
+ "total_flos": 7.115852825454182e+17,
372
+ "train_batch_size": 64,
373
+ "trial_name": null,
374
+ "trial_params": null
375
+ }