RobertoSonic committed on
Commit
fbc81c4
·
verified ·
1 Parent(s): 86d209e

End of training

Browse files
README.md CHANGED
@@ -18,8 +18,8 @@ should probably proofread and complete it, then remove this comment. -->
18
 
19
  This model is a fine-tuned version of [microsoft/swinv2-tiny-patch4-window8-256](https://huggingface.co/microsoft/swinv2-tiny-patch4-window8-256) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
- - Loss: 0.8094
22
- - Accuracy: 0.7386
23
 
24
  ## Model description
25
 
 
18
 
19
  This model is a fine-tuned version of [microsoft/swinv2-tiny-patch4-window8-256](https://huggingface.co/microsoft/swinv2-tiny-patch4-window8-256) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
+ - Loss: 0.7753
22
+ - Accuracy: 0.75
23
 
24
  ## Model description
25
 
all_results.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 33.38095238095238,
3
+ "eval_accuracy": 0.75,
4
+ "eval_loss": 0.7753319144248962,
5
+ "eval_runtime": 1.5195,
6
+ "eval_samples_per_second": 57.914,
7
+ "eval_steps_per_second": 1.974,
8
+ "total_flos": 7.202076007838515e+17,
9
+ "train_loss": 0.5288270854949951,
10
+ "train_runtime": 627.2045,
11
+ "train_samples_per_second": 52.854,
12
+ "train_steps_per_second": 0.159
13
+ }
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 33.38095238095238,
3
+ "eval_accuracy": 0.75,
4
+ "eval_loss": 0.7753319144248962,
5
+ "eval_runtime": 1.5195,
6
+ "eval_samples_per_second": 57.914,
7
+ "eval_steps_per_second": 1.974
8
+ }
runs/Feb10_00-33-52_e3629502e642/events.out.tfevents.1739148302.e3629502e642.30696.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d06d9efbfd8042d769faf6cbb900c57a9ad28059f56029046deb61d8fc17123
3
+ size 405
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 33.38095238095238,
3
+ "total_flos": 7.202076007838515e+17,
4
+ "train_loss": 0.5288270854949951,
5
+ "train_runtime": 627.2045,
6
+ "train_samples_per_second": 52.854,
7
+ "train_steps_per_second": 0.159
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,418 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.75,
3
+ "best_model_checkpoint": "swinv2-tiny-patch4-window8-256-dmae-humeda-DAV54/checkpoint-60",
4
+ "epoch": 33.38095238095238,
5
+ "eval_steps": 500,
6
+ "global_step": 100,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 1.0,
13
+ "eval_accuracy": 0.19318181818181818,
14
+ "eval_loss": 1.585249423980713,
15
+ "eval_runtime": 1.4912,
16
+ "eval_samples_per_second": 59.014,
17
+ "eval_steps_per_second": 2.012,
18
+ "step": 3
19
+ },
20
+ {
21
+ "epoch": 2.0,
22
+ "eval_accuracy": 0.3181818181818182,
23
+ "eval_loss": 1.578413486480713,
24
+ "eval_runtime": 1.5431,
25
+ "eval_samples_per_second": 57.028,
26
+ "eval_steps_per_second": 1.944,
27
+ "step": 6
28
+ },
29
+ {
30
+ "epoch": 3.0,
31
+ "eval_accuracy": 0.4318181818181818,
32
+ "eval_loss": 1.537353515625,
33
+ "eval_runtime": 1.5969,
34
+ "eval_samples_per_second": 55.107,
35
+ "eval_steps_per_second": 1.879,
36
+ "step": 9
37
+ },
38
+ {
39
+ "epoch": 3.380952380952381,
40
+ "grad_norm": 3.083775520324707,
41
+ "learning_rate": 5e-05,
42
+ "loss": 1.3768,
43
+ "step": 10
44
+ },
45
+ {
46
+ "epoch": 4.0,
47
+ "eval_accuracy": 0.4090909090909091,
48
+ "eval_loss": 1.4629433155059814,
49
+ "eval_runtime": 1.5346,
50
+ "eval_samples_per_second": 57.345,
51
+ "eval_steps_per_second": 1.955,
52
+ "step": 12
53
+ },
54
+ {
55
+ "epoch": 5.0,
56
+ "eval_accuracy": 0.5340909090909091,
57
+ "eval_loss": 1.2221930027008057,
58
+ "eval_runtime": 2.5597,
59
+ "eval_samples_per_second": 34.379,
60
+ "eval_steps_per_second": 1.172,
61
+ "step": 15
62
+ },
63
+ {
64
+ "epoch": 6.0,
65
+ "eval_accuracy": 0.5454545454545454,
66
+ "eval_loss": 1.2436859607696533,
67
+ "eval_runtime": 1.5399,
68
+ "eval_samples_per_second": 57.146,
69
+ "eval_steps_per_second": 1.948,
70
+ "step": 18
71
+ },
72
+ {
73
+ "epoch": 6.761904761904762,
74
+ "grad_norm": 4.605942249298096,
75
+ "learning_rate": 4.849231551964771e-05,
76
+ "loss": 0.942,
77
+ "step": 20
78
+ },
79
+ {
80
+ "epoch": 7.0,
81
+ "eval_accuracy": 0.5340909090909091,
82
+ "eval_loss": 1.242801308631897,
83
+ "eval_runtime": 1.5797,
84
+ "eval_samples_per_second": 55.707,
85
+ "eval_steps_per_second": 1.899,
86
+ "step": 21
87
+ },
88
+ {
89
+ "epoch": 8.0,
90
+ "eval_accuracy": 0.5340909090909091,
91
+ "eval_loss": 1.1750913858413696,
92
+ "eval_runtime": 2.5156,
93
+ "eval_samples_per_second": 34.982,
94
+ "eval_steps_per_second": 1.193,
95
+ "step": 24
96
+ },
97
+ {
98
+ "epoch": 9.0,
99
+ "eval_accuracy": 0.5795454545454546,
100
+ "eval_loss": 1.1278696060180664,
101
+ "eval_runtime": 2.3024,
102
+ "eval_samples_per_second": 38.222,
103
+ "eval_steps_per_second": 1.303,
104
+ "step": 27
105
+ },
106
+ {
107
+ "epoch": 10.0,
108
+ "grad_norm": 6.71976900100708,
109
+ "learning_rate": 4.415111107797445e-05,
110
+ "loss": 0.6265,
111
+ "step": 30
112
+ },
113
+ {
114
+ "epoch": 10.0,
115
+ "eval_accuracy": 0.6477272727272727,
116
+ "eval_loss": 0.9868423342704773,
117
+ "eval_runtime": 2.2207,
118
+ "eval_samples_per_second": 39.627,
119
+ "eval_steps_per_second": 1.351,
120
+ "step": 30
121
+ },
122
+ {
123
+ "epoch": 11.0,
124
+ "eval_accuracy": 0.6363636363636364,
125
+ "eval_loss": 0.9661000967025757,
126
+ "eval_runtime": 2.178,
127
+ "eval_samples_per_second": 40.404,
128
+ "eval_steps_per_second": 1.377,
129
+ "step": 33
130
+ },
131
+ {
132
+ "epoch": 12.0,
133
+ "eval_accuracy": 0.6136363636363636,
134
+ "eval_loss": 0.9892013669013977,
135
+ "eval_runtime": 2.2016,
136
+ "eval_samples_per_second": 39.97,
137
+ "eval_steps_per_second": 1.363,
138
+ "step": 36
139
+ },
140
+ {
141
+ "epoch": 13.0,
142
+ "eval_accuracy": 0.6818181818181818,
143
+ "eval_loss": 0.87156081199646,
144
+ "eval_runtime": 1.6274,
145
+ "eval_samples_per_second": 54.073,
146
+ "eval_steps_per_second": 1.843,
147
+ "step": 39
148
+ },
149
+ {
150
+ "epoch": 13.380952380952381,
151
+ "grad_norm": 6.5638837814331055,
152
+ "learning_rate": 3.7500000000000003e-05,
153
+ "loss": 0.5106,
154
+ "step": 40
155
+ },
156
+ {
157
+ "epoch": 14.0,
158
+ "eval_accuracy": 0.7272727272727273,
159
+ "eval_loss": 0.8009552359580994,
160
+ "eval_runtime": 1.5443,
161
+ "eval_samples_per_second": 56.984,
162
+ "eval_steps_per_second": 1.943,
163
+ "step": 42
164
+ },
165
+ {
166
+ "epoch": 15.0,
167
+ "eval_accuracy": 0.6818181818181818,
168
+ "eval_loss": 0.8596124053001404,
169
+ "eval_runtime": 1.5414,
170
+ "eval_samples_per_second": 57.091,
171
+ "eval_steps_per_second": 1.946,
172
+ "step": 45
173
+ },
174
+ {
175
+ "epoch": 16.0,
176
+ "eval_accuracy": 0.6931818181818182,
177
+ "eval_loss": 0.8257151246070862,
178
+ "eval_runtime": 2.2212,
179
+ "eval_samples_per_second": 39.619,
180
+ "eval_steps_per_second": 1.351,
181
+ "step": 48
182
+ },
183
+ {
184
+ "epoch": 16.761904761904763,
185
+ "grad_norm": 5.321930885314941,
186
+ "learning_rate": 2.9341204441673266e-05,
187
+ "loss": 0.4183,
188
+ "step": 50
189
+ },
190
+ {
191
+ "epoch": 17.0,
192
+ "eval_accuracy": 0.7045454545454546,
193
+ "eval_loss": 0.8189888000488281,
194
+ "eval_runtime": 1.5383,
195
+ "eval_samples_per_second": 57.207,
196
+ "eval_steps_per_second": 1.95,
197
+ "step": 51
198
+ },
199
+ {
200
+ "epoch": 18.0,
201
+ "eval_accuracy": 0.7272727272727273,
202
+ "eval_loss": 0.7627521753311157,
203
+ "eval_runtime": 2.2402,
204
+ "eval_samples_per_second": 39.283,
205
+ "eval_steps_per_second": 1.339,
206
+ "step": 54
207
+ },
208
+ {
209
+ "epoch": 19.0,
210
+ "eval_accuracy": 0.7159090909090909,
211
+ "eval_loss": 0.7801702618598938,
212
+ "eval_runtime": 2.2768,
213
+ "eval_samples_per_second": 38.651,
214
+ "eval_steps_per_second": 1.318,
215
+ "step": 57
216
+ },
217
+ {
218
+ "epoch": 20.0,
219
+ "grad_norm": 3.8304524421691895,
220
+ "learning_rate": 2.0658795558326743e-05,
221
+ "loss": 0.3267,
222
+ "step": 60
223
+ },
224
+ {
225
+ "epoch": 20.0,
226
+ "eval_accuracy": 0.75,
227
+ "eval_loss": 0.7753319144248962,
228
+ "eval_runtime": 2.3302,
229
+ "eval_samples_per_second": 37.766,
230
+ "eval_steps_per_second": 1.287,
231
+ "step": 60
232
+ },
233
+ {
234
+ "epoch": 21.0,
235
+ "eval_accuracy": 0.7386363636363636,
236
+ "eval_loss": 0.7770728468894958,
237
+ "eval_runtime": 2.2672,
238
+ "eval_samples_per_second": 38.815,
239
+ "eval_steps_per_second": 1.323,
240
+ "step": 63
241
+ },
242
+ {
243
+ "epoch": 22.0,
244
+ "eval_accuracy": 0.75,
245
+ "eval_loss": 0.7770181894302368,
246
+ "eval_runtime": 2.3268,
247
+ "eval_samples_per_second": 37.821,
248
+ "eval_steps_per_second": 1.289,
249
+ "step": 66
250
+ },
251
+ {
252
+ "epoch": 23.0,
253
+ "eval_accuracy": 0.7272727272727273,
254
+ "eval_loss": 0.7940635681152344,
255
+ "eval_runtime": 2.2104,
256
+ "eval_samples_per_second": 39.812,
257
+ "eval_steps_per_second": 1.357,
258
+ "step": 69
259
+ },
260
+ {
261
+ "epoch": 23.38095238095238,
262
+ "grad_norm": 5.505289077758789,
263
+ "learning_rate": 1.2500000000000006e-05,
264
+ "loss": 0.3008,
265
+ "step": 70
266
+ },
267
+ {
268
+ "epoch": 24.0,
269
+ "eval_accuracy": 0.7272727272727273,
270
+ "eval_loss": 0.7921419739723206,
271
+ "eval_runtime": 2.1726,
272
+ "eval_samples_per_second": 40.505,
273
+ "eval_steps_per_second": 1.381,
274
+ "step": 72
275
+ },
276
+ {
277
+ "epoch": 25.0,
278
+ "eval_accuracy": 0.7386363636363636,
279
+ "eval_loss": 0.7899277210235596,
280
+ "eval_runtime": 2.2223,
281
+ "eval_samples_per_second": 39.599,
282
+ "eval_steps_per_second": 1.35,
283
+ "step": 75
284
+ },
285
+ {
286
+ "epoch": 26.0,
287
+ "eval_accuracy": 0.75,
288
+ "eval_loss": 0.7849180698394775,
289
+ "eval_runtime": 2.1648,
290
+ "eval_samples_per_second": 40.65,
291
+ "eval_steps_per_second": 1.386,
292
+ "step": 78
293
+ },
294
+ {
295
+ "epoch": 26.761904761904763,
296
+ "grad_norm": 5.414725303649902,
297
+ "learning_rate": 5.848888922025553e-06,
298
+ "loss": 0.2795,
299
+ "step": 80
300
+ },
301
+ {
302
+ "epoch": 27.0,
303
+ "eval_accuracy": 0.75,
304
+ "eval_loss": 0.7891153693199158,
305
+ "eval_runtime": 2.2542,
306
+ "eval_samples_per_second": 39.038,
307
+ "eval_steps_per_second": 1.331,
308
+ "step": 81
309
+ },
310
+ {
311
+ "epoch": 28.0,
312
+ "eval_accuracy": 0.7386363636363636,
313
+ "eval_loss": 0.7973006963729858,
314
+ "eval_runtime": 2.205,
315
+ "eval_samples_per_second": 39.909,
316
+ "eval_steps_per_second": 1.361,
317
+ "step": 84
318
+ },
319
+ {
320
+ "epoch": 29.0,
321
+ "eval_accuracy": 0.7386363636363636,
322
+ "eval_loss": 0.8067693710327148,
323
+ "eval_runtime": 2.1816,
324
+ "eval_samples_per_second": 40.338,
325
+ "eval_steps_per_second": 1.375,
326
+ "step": 87
327
+ },
328
+ {
329
+ "epoch": 30.0,
330
+ "grad_norm": 4.411905765533447,
331
+ "learning_rate": 1.5076844803522922e-06,
332
+ "loss": 0.2526,
333
+ "step": 90
334
+ },
335
+ {
336
+ "epoch": 30.0,
337
+ "eval_accuracy": 0.7386363636363636,
338
+ "eval_loss": 0.8087642788887024,
339
+ "eval_runtime": 1.5036,
340
+ "eval_samples_per_second": 58.526,
341
+ "eval_steps_per_second": 1.995,
342
+ "step": 90
343
+ },
344
+ {
345
+ "epoch": 31.0,
346
+ "eval_accuracy": 0.7386363636363636,
347
+ "eval_loss": 0.8097642660140991,
348
+ "eval_runtime": 1.8153,
349
+ "eval_samples_per_second": 48.476,
350
+ "eval_steps_per_second": 1.653,
351
+ "step": 93
352
+ },
353
+ {
354
+ "epoch": 32.0,
355
+ "eval_accuracy": 0.7386363636363636,
356
+ "eval_loss": 0.8095622658729553,
357
+ "eval_runtime": 1.82,
358
+ "eval_samples_per_second": 48.352,
359
+ "eval_steps_per_second": 1.648,
360
+ "step": 96
361
+ },
362
+ {
363
+ "epoch": 33.0,
364
+ "eval_accuracy": 0.7386363636363636,
365
+ "eval_loss": 0.8095269799232483,
366
+ "eval_runtime": 1.7559,
367
+ "eval_samples_per_second": 50.118,
368
+ "eval_steps_per_second": 1.709,
369
+ "step": 99
370
+ },
371
+ {
372
+ "epoch": 33.38095238095238,
373
+ "grad_norm": 5.03811502456665,
374
+ "learning_rate": 0.0,
375
+ "loss": 0.2544,
376
+ "step": 100
377
+ },
378
+ {
379
+ "epoch": 33.38095238095238,
380
+ "eval_accuracy": 0.7386363636363636,
381
+ "eval_loss": 0.8093982338905334,
382
+ "eval_runtime": 1.7511,
383
+ "eval_samples_per_second": 50.253,
384
+ "eval_steps_per_second": 1.713,
385
+ "step": 100
386
+ },
387
+ {
388
+ "epoch": 33.38095238095238,
389
+ "step": 100,
390
+ "total_flos": 7.202076007838515e+17,
391
+ "train_loss": 0.5288270854949951,
392
+ "train_runtime": 627.2045,
393
+ "train_samples_per_second": 52.854,
394
+ "train_steps_per_second": 0.159
395
+ }
396
+ ],
397
+ "logging_steps": 10,
398
+ "max_steps": 100,
399
+ "num_input_tokens_seen": 0,
400
+ "num_train_epochs": 50,
401
+ "save_steps": 500,
402
+ "stateful_callbacks": {
403
+ "TrainerControl": {
404
+ "args": {
405
+ "should_epoch_stop": false,
406
+ "should_evaluate": false,
407
+ "should_log": false,
408
+ "should_save": true,
409
+ "should_training_stop": true
410
+ },
411
+ "attributes": {}
412
+ }
413
+ },
414
+ "total_flos": 7.202076007838515e+17,
415
+ "train_batch_size": 32,
416
+ "trial_name": null,
417
+ "trial_params": null
418
+ }