Augusto777 committed on
Commit
d0af476
·
verified ·
1 Parent(s): 1d6e616

End of training

Browse files
README.md CHANGED
@@ -22,7 +22,7 @@ model-index:
22
  metrics:
23
  - name: Accuracy
24
  type: accuracy
25
- value: 0.7647058823529411
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -32,8 +32,8 @@ should probably proofread and complete it, then remove this comment. -->
32
 
33
  This model is a fine-tuned version of [google/vit-base-patch16-224](https://huggingface.co/google/vit-base-patch16-224) on the imagefolder dataset.
34
  It achieves the following results on the evaluation set:
35
- - Loss: 0.7772
36
- - Accuracy: 0.7647
37
 
38
  ## Model description
39
 
 
22
  metrics:
23
  - name: Accuracy
24
  type: accuracy
25
+ value: 0.8431372549019608
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
32
 
33
  This model is a fine-tuned version of [google/vit-base-patch16-224](https://huggingface.co/google/vit-base-patch16-224) on the imagefolder dataset.
34
  It achieves the following results on the evaluation set:
35
+ - Loss: 0.6158
36
+ - Accuracy: 0.8431
37
 
38
  ## Model description
39
 
all_results.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 22.69,
3
+ "eval_accuracy": 0.8431372549019608,
4
+ "eval_loss": 0.6158193945884705,
5
+ "eval_runtime": 1.0507,
6
+ "eval_samples_per_second": 48.54,
7
+ "eval_steps_per_second": 1.904,
8
+ "train_loss": 0.3522763775709348,
9
+ "train_runtime": 628.612,
10
+ "train_samples_per_second": 66.776,
11
+ "train_steps_per_second": 0.496
12
+ }
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 22.69,
3
+ "eval_accuracy": 0.8431372549019608,
4
+ "eval_loss": 0.6158193945884705,
5
+ "eval_runtime": 1.0507,
6
+ "eval_samples_per_second": 48.54,
7
+ "eval_steps_per_second": 1.904
8
+ }
runs/Jun10_10-19-01_DESKTOP-SKBE9FB/events.out.tfevents.1718037065.DESKTOP-SKBE9FB.8944.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0f46763d311f31391244b9611831f5fa01cf1a23adfbf4a36abae538d8c917a
3
+ size 411
train_results.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 22.69,
3
+ "train_loss": 0.3522763775709348,
4
+ "train_runtime": 628.612,
5
+ "train_samples_per_second": 66.776,
6
+ "train_steps_per_second": 0.496
7
+ }
trainer_state.json ADDED
@@ -0,0 +1,423 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.8431372549019608,
3
+ "best_model_checkpoint": "vit-base-patch16-224-RXL1-24\\checkpoint-96",
4
+ "epoch": 22.69090909090909,
5
+ "eval_steps": 500,
6
+ "global_step": 312,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.73,
13
+ "learning_rate": 3.4375e-05,
14
+ "loss": 1.3745,
15
+ "step": 10
16
+ },
17
+ {
18
+ "epoch": 0.95,
19
+ "eval_accuracy": 0.47058823529411764,
20
+ "eval_loss": 1.3056340217590332,
21
+ "eval_runtime": 0.7424,
22
+ "eval_samples_per_second": 68.693,
23
+ "eval_steps_per_second": 2.694,
24
+ "step": 13
25
+ },
26
+ {
27
+ "epoch": 1.45,
28
+ "learning_rate": 5.4256756756756764e-05,
29
+ "loss": 1.2896,
30
+ "step": 20
31
+ },
32
+ {
33
+ "epoch": 1.96,
34
+ "eval_accuracy": 0.6470588235294118,
35
+ "eval_loss": 1.103859543800354,
36
+ "eval_runtime": 0.7848,
37
+ "eval_samples_per_second": 64.988,
38
+ "eval_steps_per_second": 2.549,
39
+ "step": 27
40
+ },
41
+ {
42
+ "epoch": 2.18,
43
+ "learning_rate": 5.239864864864865e-05,
44
+ "loss": 1.1563,
45
+ "step": 30
46
+ },
47
+ {
48
+ "epoch": 2.91,
49
+ "learning_rate": 5.0540540540540544e-05,
50
+ "loss": 0.9896,
51
+ "step": 40
52
+ },
53
+ {
54
+ "epoch": 2.98,
55
+ "eval_accuracy": 0.6470588235294118,
56
+ "eval_loss": 0.9412985444068909,
57
+ "eval_runtime": 0.7684,
58
+ "eval_samples_per_second": 66.368,
59
+ "eval_steps_per_second": 2.603,
60
+ "step": 41
61
+ },
62
+ {
63
+ "epoch": 3.64,
64
+ "learning_rate": 4.868243243243243e-05,
65
+ "loss": 0.8472,
66
+ "step": 50
67
+ },
68
+ {
69
+ "epoch": 4.0,
70
+ "eval_accuracy": 0.6274509803921569,
71
+ "eval_loss": 0.905930757522583,
72
+ "eval_runtime": 0.7968,
73
+ "eval_samples_per_second": 64.003,
74
+ "eval_steps_per_second": 2.51,
75
+ "step": 55
76
+ },
77
+ {
78
+ "epoch": 4.36,
79
+ "learning_rate": 4.6824324324324325e-05,
80
+ "loss": 0.7375,
81
+ "step": 60
82
+ },
83
+ {
84
+ "epoch": 4.95,
85
+ "eval_accuracy": 0.803921568627451,
86
+ "eval_loss": 0.6519917249679565,
87
+ "eval_runtime": 0.822,
88
+ "eval_samples_per_second": 62.047,
89
+ "eval_steps_per_second": 2.433,
90
+ "step": 68
91
+ },
92
+ {
93
+ "epoch": 5.09,
94
+ "learning_rate": 4.496621621621622e-05,
95
+ "loss": 0.5786,
96
+ "step": 70
97
+ },
98
+ {
99
+ "epoch": 5.82,
100
+ "learning_rate": 4.3108108108108106e-05,
101
+ "loss": 0.458,
102
+ "step": 80
103
+ },
104
+ {
105
+ "epoch": 5.96,
106
+ "eval_accuracy": 0.803921568627451,
107
+ "eval_loss": 0.6753640174865723,
108
+ "eval_runtime": 0.8618,
109
+ "eval_samples_per_second": 59.178,
110
+ "eval_steps_per_second": 2.321,
111
+ "step": 82
112
+ },
113
+ {
114
+ "epoch": 6.55,
115
+ "learning_rate": 4.125e-05,
116
+ "loss": 0.3807,
117
+ "step": 90
118
+ },
119
+ {
120
+ "epoch": 6.98,
121
+ "eval_accuracy": 0.8431372549019608,
122
+ "eval_loss": 0.6158193945884705,
123
+ "eval_runtime": 0.7813,
124
+ "eval_samples_per_second": 65.275,
125
+ "eval_steps_per_second": 2.56,
126
+ "step": 96
127
+ },
128
+ {
129
+ "epoch": 7.27,
130
+ "learning_rate": 3.9391891891891894e-05,
131
+ "loss": 0.3282,
132
+ "step": 100
133
+ },
134
+ {
135
+ "epoch": 8.0,
136
+ "learning_rate": 3.753378378378379e-05,
137
+ "loss": 0.3003,
138
+ "step": 110
139
+ },
140
+ {
141
+ "epoch": 8.0,
142
+ "eval_accuracy": 0.803921568627451,
143
+ "eval_loss": 0.5665538311004639,
144
+ "eval_runtime": 0.7924,
145
+ "eval_samples_per_second": 64.358,
146
+ "eval_steps_per_second": 2.524,
147
+ "step": 110
148
+ },
149
+ {
150
+ "epoch": 8.73,
151
+ "learning_rate": 3.567567567567568e-05,
152
+ "loss": 0.2337,
153
+ "step": 120
154
+ },
155
+ {
156
+ "epoch": 8.95,
157
+ "eval_accuracy": 0.803921568627451,
158
+ "eval_loss": 0.5409361124038696,
159
+ "eval_runtime": 0.8091,
160
+ "eval_samples_per_second": 63.033,
161
+ "eval_steps_per_second": 2.472,
162
+ "step": 123
163
+ },
164
+ {
165
+ "epoch": 9.45,
166
+ "learning_rate": 3.381756756756757e-05,
167
+ "loss": 0.2252,
168
+ "step": 130
169
+ },
170
+ {
171
+ "epoch": 9.96,
172
+ "eval_accuracy": 0.7647058823529411,
173
+ "eval_loss": 0.7381905913352966,
174
+ "eval_runtime": 0.8081,
175
+ "eval_samples_per_second": 63.11,
176
+ "eval_steps_per_second": 2.475,
177
+ "step": 137
178
+ },
179
+ {
180
+ "epoch": 10.18,
181
+ "learning_rate": 3.1959459459459455e-05,
182
+ "loss": 0.1952,
183
+ "step": 140
184
+ },
185
+ {
186
+ "epoch": 10.91,
187
+ "learning_rate": 3.010135135135135e-05,
188
+ "loss": 0.1644,
189
+ "step": 150
190
+ },
191
+ {
192
+ "epoch": 10.98,
193
+ "eval_accuracy": 0.803921568627451,
194
+ "eval_loss": 0.6363002061843872,
195
+ "eval_runtime": 0.7874,
196
+ "eval_samples_per_second": 64.774,
197
+ "eval_steps_per_second": 2.54,
198
+ "step": 151
199
+ },
200
+ {
201
+ "epoch": 11.64,
202
+ "learning_rate": 2.8243243243243243e-05,
203
+ "loss": 0.1608,
204
+ "step": 160
205
+ },
206
+ {
207
+ "epoch": 12.0,
208
+ "eval_accuracy": 0.803921568627451,
209
+ "eval_loss": 0.6941252946853638,
210
+ "eval_runtime": 0.809,
211
+ "eval_samples_per_second": 63.04,
212
+ "eval_steps_per_second": 2.472,
213
+ "step": 165
214
+ },
215
+ {
216
+ "epoch": 12.36,
217
+ "learning_rate": 2.6385135135135137e-05,
218
+ "loss": 0.1354,
219
+ "step": 170
220
+ },
221
+ {
222
+ "epoch": 12.95,
223
+ "eval_accuracy": 0.7843137254901961,
224
+ "eval_loss": 0.6985132694244385,
225
+ "eval_runtime": 0.7967,
226
+ "eval_samples_per_second": 64.012,
227
+ "eval_steps_per_second": 2.51,
228
+ "step": 178
229
+ },
230
+ {
231
+ "epoch": 13.09,
232
+ "learning_rate": 2.4527027027027027e-05,
233
+ "loss": 0.1287,
234
+ "step": 180
235
+ },
236
+ {
237
+ "epoch": 13.82,
238
+ "learning_rate": 2.266891891891892e-05,
239
+ "loss": 0.1298,
240
+ "step": 190
241
+ },
242
+ {
243
+ "epoch": 13.96,
244
+ "eval_accuracy": 0.803921568627451,
245
+ "eval_loss": 0.6610224843025208,
246
+ "eval_runtime": 0.8038,
247
+ "eval_samples_per_second": 63.446,
248
+ "eval_steps_per_second": 2.488,
249
+ "step": 192
250
+ },
251
+ {
252
+ "epoch": 14.55,
253
+ "learning_rate": 2.081081081081081e-05,
254
+ "loss": 0.1333,
255
+ "step": 200
256
+ },
257
+ {
258
+ "epoch": 14.98,
259
+ "eval_accuracy": 0.803921568627451,
260
+ "eval_loss": 0.675108015537262,
261
+ "eval_runtime": 0.7776,
262
+ "eval_samples_per_second": 65.588,
263
+ "eval_steps_per_second": 2.572,
264
+ "step": 206
265
+ },
266
+ {
267
+ "epoch": 15.27,
268
+ "learning_rate": 1.89527027027027e-05,
269
+ "loss": 0.1241,
270
+ "step": 210
271
+ },
272
+ {
273
+ "epoch": 16.0,
274
+ "learning_rate": 1.7094594594594595e-05,
275
+ "loss": 0.1209,
276
+ "step": 220
277
+ },
278
+ {
279
+ "epoch": 16.0,
280
+ "eval_accuracy": 0.7843137254901961,
281
+ "eval_loss": 0.7722602486610413,
282
+ "eval_runtime": 0.7727,
283
+ "eval_samples_per_second": 66.007,
284
+ "eval_steps_per_second": 2.588,
285
+ "step": 220
286
+ },
287
+ {
288
+ "epoch": 16.73,
289
+ "learning_rate": 1.5236486486486487e-05,
290
+ "loss": 0.1057,
291
+ "step": 230
292
+ },
293
+ {
294
+ "epoch": 16.95,
295
+ "eval_accuracy": 0.7254901960784313,
296
+ "eval_loss": 0.8037699460983276,
297
+ "eval_runtime": 0.7639,
298
+ "eval_samples_per_second": 66.761,
299
+ "eval_steps_per_second": 2.618,
300
+ "step": 233
301
+ },
302
+ {
303
+ "epoch": 17.45,
304
+ "learning_rate": 1.337837837837838e-05,
305
+ "loss": 0.0972,
306
+ "step": 240
307
+ },
308
+ {
309
+ "epoch": 17.96,
310
+ "eval_accuracy": 0.7647058823529411,
311
+ "eval_loss": 0.8375279307365417,
312
+ "eval_runtime": 0.7813,
313
+ "eval_samples_per_second": 65.279,
314
+ "eval_steps_per_second": 2.56,
315
+ "step": 247
316
+ },
317
+ {
318
+ "epoch": 18.18,
319
+ "learning_rate": 1.152027027027027e-05,
320
+ "loss": 0.0974,
321
+ "step": 250
322
+ },
323
+ {
324
+ "epoch": 18.91,
325
+ "learning_rate": 9.662162162162164e-06,
326
+ "loss": 0.0789,
327
+ "step": 260
328
+ },
329
+ {
330
+ "epoch": 18.98,
331
+ "eval_accuracy": 0.8235294117647058,
332
+ "eval_loss": 0.697125256061554,
333
+ "eval_runtime": 0.8068,
334
+ "eval_samples_per_second": 63.21,
335
+ "eval_steps_per_second": 2.479,
336
+ "step": 261
337
+ },
338
+ {
339
+ "epoch": 19.64,
340
+ "learning_rate": 7.804054054054054e-06,
341
+ "loss": 0.0833,
342
+ "step": 270
343
+ },
344
+ {
345
+ "epoch": 20.0,
346
+ "eval_accuracy": 0.7843137254901961,
347
+ "eval_loss": 0.7507321238517761,
348
+ "eval_runtime": 0.8032,
349
+ "eval_samples_per_second": 63.499,
350
+ "eval_steps_per_second": 2.49,
351
+ "step": 275
352
+ },
353
+ {
354
+ "epoch": 20.36,
355
+ "learning_rate": 5.945945945945946e-06,
356
+ "loss": 0.0813,
357
+ "step": 280
358
+ },
359
+ {
360
+ "epoch": 20.95,
361
+ "eval_accuracy": 0.7843137254901961,
362
+ "eval_loss": 0.7085339426994324,
363
+ "eval_runtime": 0.7675,
364
+ "eval_samples_per_second": 66.445,
365
+ "eval_steps_per_second": 2.606,
366
+ "step": 288
367
+ },
368
+ {
369
+ "epoch": 21.09,
370
+ "learning_rate": 4.087837837837838e-06,
371
+ "loss": 0.0874,
372
+ "step": 290
373
+ },
374
+ {
375
+ "epoch": 21.82,
376
+ "learning_rate": 2.22972972972973e-06,
377
+ "loss": 0.0803,
378
+ "step": 300
379
+ },
380
+ {
381
+ "epoch": 21.96,
382
+ "eval_accuracy": 0.7647058823529411,
383
+ "eval_loss": 0.7565922737121582,
384
+ "eval_runtime": 0.8044,
385
+ "eval_samples_per_second": 63.404,
386
+ "eval_steps_per_second": 2.486,
387
+ "step": 302
388
+ },
389
+ {
390
+ "epoch": 22.55,
391
+ "learning_rate": 3.7162162162162164e-07,
392
+ "loss": 0.0693,
393
+ "step": 310
394
+ },
395
+ {
396
+ "epoch": 22.69,
397
+ "eval_accuracy": 0.7647058823529411,
398
+ "eval_loss": 0.7772119045257568,
399
+ "eval_runtime": 0.7864,
400
+ "eval_samples_per_second": 64.855,
401
+ "eval_steps_per_second": 2.543,
402
+ "step": 312
403
+ },
404
+ {
405
+ "epoch": 22.69,
406
+ "step": 312,
407
+ "total_flos": 3.0760221736008253e+18,
408
+ "train_loss": 0.3522763775709348,
409
+ "train_runtime": 628.612,
410
+ "train_samples_per_second": 66.776,
411
+ "train_steps_per_second": 0.496
412
+ }
413
+ ],
414
+ "logging_steps": 10,
415
+ "max_steps": 312,
416
+ "num_input_tokens_seen": 0,
417
+ "num_train_epochs": 24,
418
+ "save_steps": 500,
419
+ "total_flos": 3.0760221736008253e+18,
420
+ "train_batch_size": 32,
421
+ "trial_name": null,
422
+ "trial_params": null
423
+ }