SodaXII committed on
Commit
7959889
·
verified ·
1 Parent(s): 6b4e51a

Model save

Browse files
README.md CHANGED
@@ -4,6 +4,8 @@ license: apache-2.0
4
  base_model: google/vit-base-patch16-224
5
  tags:
6
  - generated_from_trainer
 
 
7
  model-index:
8
  - name: vit-base-patch16-224_rice-leaf-disease-augmented-v2_fft
9
  results: []
@@ -16,13 +18,8 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  This model is a fine-tuned version of [google/vit-base-patch16-224](https://huggingface.co/google/vit-base-patch16-224) on an unknown dataset.
18
  It achieves the following results on the evaluation set:
19
- - epoch: 18.0
20
- - eval_accuracy: 0.9196
21
- - eval_loss: 0.3620
22
- - eval_runtime: 11.0713
23
- - eval_samples_per_second: 30.349
24
- - eval_steps_per_second: 0.542
25
- - step: 2250
26
 
27
  ## Model description
28
 
@@ -51,6 +48,30 @@ The following hyperparameters were used during training:
51
  - num_epochs: 15
52
  - mixed_precision_training: Native AMP
53
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
54
  ### Framework versions
55
 
56
  - Transformers 4.48.3
 
4
  base_model: google/vit-base-patch16-224
5
  tags:
6
  - generated_from_trainer
7
+ metrics:
8
+ - accuracy
9
  model-index:
10
  - name: vit-base-patch16-224_rice-leaf-disease-augmented-v2_fft
11
  results: []
 
18
 
19
  This model is a fine-tuned version of [google/vit-base-patch16-224](https://huggingface.co/google/vit-base-patch16-224) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
+ - Accuracy: 0.9196
22
+ - Loss: 0.3620
 
 
 
 
 
23
 
24
  ## Model description
25
 
 
48
  - num_epochs: 15
49
  - mixed_precision_training: Native AMP
50
 
51
+ ### Training results
52
+
53
+ | Training Loss | Epoch | Step | Accuracy | Validation Loss |
54
+ |:-------------:|:-----:|:----:|:--------:|:---------------:|
55
+ | 1.9482 | 1.0 | 125 | 0.5685 | 1.5012 |
56
+ | 0.9894 | 2.0 | 250 | 0.7976 | 0.6444 |
57
+ | 0.3321 | 3.0 | 375 | 0.8958 | 0.3859 |
58
+ | 0.1115 | 4.0 | 500 | 0.9107 | 0.3081 |
59
+ | 0.0387 | 5.0 | 625 | 0.9137 | 0.2980 |
60
+ | 0.0204 | 6.0 | 750 | 0.9137 | 0.2936 |
61
+ | 0.0169 | 7.0 | 875 | 0.9196 | 0.2953 |
62
+ | 0.0078 | 8.0 | 1000 | 0.9226 | 0.3067 |
63
+ | 0.0034 | 9.0 | 1125 | 0.9286 | 0.3087 |
64
+ | 0.0025 | 10.0 | 1250 | 0.9196 | 0.3139 |
65
+ | 0.0023 | 11.0 | 1375 | 0.9196 | 0.3142 |
66
+ | 0.0019 | 12.0 | 1500 | 0.9196 | 0.3288 |
67
+ | 0.0013 | 13.0 | 1625 | 0.9196 | 0.3359 |
68
+ | 0.001 | 14.0 | 1750 | 0.9226 | 0.3413 |
69
+ | 0.0009 | 15.0 | 1875 | 0.9226 | 0.3425 |
70
+ | 0.0009 | 16.0 | 2000 | 0.9226 | 0.3481 |
71
+ | 0.0007 | 17.0 | 2125 | 0.9226 | 0.3571 |
72
+ | 0.0006 | 18.0 | 2250 | 0.9196 | 0.3620 |
73
+
74
+
75
  ### Framework versions
76
 
77
  - Transformers 4.48.3
logs/events.out.tfevents.1740444395.4a8a76f3e68a.1955.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fa79a1d4ec4bca93aaf1b6810cbf2efcad36d9606487ce3e1c783c4f1bf89cc2
3
- size 88
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:665349651650707fd38cbf97bd56fc049951be360fcfe9126e5e5ef8a0229fa4
3
+ size 6021
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7ccfeb9fcbfcb69bb1dd3f91ab957cedb45851be3c8d25ba88c6576bc370a613
3
  size 343242432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e45518fd16a0cfc3f3db29de59fd516f8807a340ff671f0c2bd29aa81adca17
3
  size 343242432
trainer_state.json CHANGED
@@ -1,17 +1,306 @@
1
  {
2
- "best_metric": null,
3
- "best_model_checkpoint": null,
4
- "epoch": 0,
5
  "eval_steps": 500,
6
- "global_step": 0,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
- "log_history": [],
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
11
  "logging_steps": 500,
12
- "max_steps": 2500,
13
  "num_input_tokens_seen": 0,
14
- "num_train_epochs": 20,
15
  "save_steps": 500,
16
  "stateful_callbacks": {
17
  "TrainerControl": {
@@ -19,13 +308,13 @@
19
  "should_epoch_stop": false,
20
  "should_evaluate": false,
21
  "should_log": false,
22
- "should_save": false,
23
  "should_training_stop": false
24
  },
25
  "attributes": {}
26
  }
27
  },
28
- "total_flos": 0,
29
  "train_batch_size": 64,
30
  "trial_name": null,
31
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.29358136653900146,
3
+ "best_model_checkpoint": "./drive/Shareddrives/CS198-Drones/training_output/vit-base-patch16-224_rice-leaf-disease-augmented-v2_fft/checkpoint-750",
4
+ "epoch": 18.0,
5
  "eval_steps": 500,
6
+ "global_step": 2250,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 1.0,
13
+ "grad_norm": 3.8496286869049072,
14
+ "learning_rate": 5e-06,
15
+ "loss": 1.9482,
16
+ "step": 125
17
+ },
18
+ {
19
+ "epoch": 1.0,
20
+ "eval_accuracy": 0.5684523809523809,
21
+ "eval_loss": 1.5012105703353882,
22
+ "eval_runtime": 11.0652,
23
+ "eval_samples_per_second": 30.365,
24
+ "eval_steps_per_second": 0.542,
25
+ "step": 125
26
+ },
27
+ {
28
+ "epoch": 2.0,
29
+ "grad_norm": 3.772235155105591,
30
+ "learning_rate": 1e-05,
31
+ "loss": 0.9894,
32
+ "step": 250
33
+ },
34
+ {
35
+ "epoch": 2.0,
36
+ "eval_accuracy": 0.7976190476190477,
37
+ "eval_loss": 0.6444453001022339,
38
+ "eval_runtime": 11.0129,
39
+ "eval_samples_per_second": 30.51,
40
+ "eval_steps_per_second": 0.545,
41
+ "step": 250
42
+ },
43
+ {
44
+ "epoch": 3.0,
45
+ "grad_norm": 1.4745649099349976,
46
+ "learning_rate": 8.83022221559489e-06,
47
+ "loss": 0.3321,
48
+ "step": 375
49
+ },
50
+ {
51
+ "epoch": 3.0,
52
+ "eval_accuracy": 0.8958333333333334,
53
+ "eval_loss": 0.3858731687068939,
54
+ "eval_runtime": 10.958,
55
+ "eval_samples_per_second": 30.663,
56
+ "eval_steps_per_second": 0.548,
57
+ "step": 375
58
+ },
59
+ {
60
+ "epoch": 4.0,
61
+ "grad_norm": 1.1253288984298706,
62
+ "learning_rate": 5.8682408883346535e-06,
63
+ "loss": 0.1115,
64
+ "step": 500
65
+ },
66
+ {
67
+ "epoch": 4.0,
68
+ "eval_accuracy": 0.9107142857142857,
69
+ "eval_loss": 0.3080737888813019,
70
+ "eval_runtime": 10.9888,
71
+ "eval_samples_per_second": 30.577,
72
+ "eval_steps_per_second": 0.546,
73
+ "step": 500
74
+ },
75
+ {
76
+ "epoch": 5.0,
77
+ "grad_norm": 0.3589422404766083,
78
+ "learning_rate": 2.5000000000000015e-06,
79
+ "loss": 0.0387,
80
+ "step": 625
81
+ },
82
+ {
83
+ "epoch": 5.0,
84
+ "eval_accuracy": 0.9136904761904762,
85
+ "eval_loss": 0.2979942262172699,
86
+ "eval_runtime": 11.1535,
87
+ "eval_samples_per_second": 30.125,
88
+ "eval_steps_per_second": 0.538,
89
+ "step": 625
90
+ },
91
+ {
92
+ "epoch": 6.0,
93
+ "grad_norm": 0.2502361536026001,
94
+ "learning_rate": 3.015368960704584e-07,
95
+ "loss": 0.0204,
96
+ "step": 750
97
+ },
98
+ {
99
+ "epoch": 6.0,
100
+ "eval_accuracy": 0.9136904761904762,
101
+ "eval_loss": 0.29358136653900146,
102
+ "eval_runtime": 11.1371,
103
+ "eval_samples_per_second": 30.169,
104
+ "eval_steps_per_second": 0.539,
105
+ "step": 750
106
+ },
107
+ {
108
+ "epoch": 7.0,
109
+ "grad_norm": 0.5141955018043518,
110
+ "learning_rate": 9.698463103929542e-06,
111
+ "loss": 0.0169,
112
+ "step": 875
113
+ },
114
+ {
115
+ "epoch": 7.0,
116
+ "eval_accuracy": 0.9196428571428571,
117
+ "eval_loss": 0.2952845096588135,
118
+ "eval_runtime": 11.0115,
119
+ "eval_samples_per_second": 30.513,
120
+ "eval_steps_per_second": 0.545,
121
+ "step": 875
122
+ },
123
+ {
124
+ "epoch": 8.0,
125
+ "grad_norm": 0.1391526609659195,
126
+ "learning_rate": 7.500000000000003e-06,
127
+ "loss": 0.0078,
128
+ "step": 1000
129
+ },
130
+ {
131
+ "epoch": 8.0,
132
+ "eval_accuracy": 0.9226190476190477,
133
+ "eval_loss": 0.3067362606525421,
134
+ "eval_runtime": 11.2875,
135
+ "eval_samples_per_second": 29.767,
136
+ "eval_steps_per_second": 0.532,
137
+ "step": 1000
138
+ },
139
+ {
140
+ "epoch": 9.0,
141
+ "grad_norm": 0.06930585205554962,
142
+ "learning_rate": 4.131759111665349e-06,
143
+ "loss": 0.0034,
144
+ "step": 1125
145
+ },
146
+ {
147
+ "epoch": 9.0,
148
+ "eval_accuracy": 0.9285714285714286,
149
+ "eval_loss": 0.3087221682071686,
150
+ "eval_runtime": 10.9679,
151
+ "eval_samples_per_second": 30.635,
152
+ "eval_steps_per_second": 0.547,
153
+ "step": 1125
154
+ },
155
+ {
156
+ "epoch": 10.0,
157
+ "grad_norm": 0.09097771346569061,
158
+ "learning_rate": 1.1697777844051105e-06,
159
+ "loss": 0.0025,
160
+ "step": 1250
161
+ },
162
+ {
163
+ "epoch": 10.0,
164
+ "eval_accuracy": 0.9196428571428571,
165
+ "eval_loss": 0.3138602674007416,
166
+ "eval_runtime": 10.3394,
167
+ "eval_samples_per_second": 32.497,
168
+ "eval_steps_per_second": 0.58,
169
+ "step": 1250
170
+ },
171
+ {
172
+ "epoch": 11.0,
173
+ "grad_norm": 0.06938016414642334,
174
+ "learning_rate": 1e-05,
175
+ "loss": 0.0023,
176
+ "step": 1375
177
+ },
178
+ {
179
+ "epoch": 11.0,
180
+ "eval_accuracy": 0.9196428571428571,
181
+ "eval_loss": 0.3141930401325226,
182
+ "eval_runtime": 10.7534,
183
+ "eval_samples_per_second": 31.246,
184
+ "eval_steps_per_second": 0.558,
185
+ "step": 1375
186
+ },
187
+ {
188
+ "epoch": 12.0,
189
+ "grad_norm": 0.04166670888662338,
190
+ "learning_rate": 8.83022221559489e-06,
191
+ "loss": 0.0019,
192
+ "step": 1500
193
+ },
194
+ {
195
+ "epoch": 12.0,
196
+ "eval_accuracy": 0.9196428571428571,
197
+ "eval_loss": 0.3288079798221588,
198
+ "eval_runtime": 10.8781,
199
+ "eval_samples_per_second": 30.888,
200
+ "eval_steps_per_second": 0.552,
201
+ "step": 1500
202
+ },
203
+ {
204
+ "epoch": 13.0,
205
+ "grad_norm": 0.04881810024380684,
206
+ "learning_rate": 5.86824088833465e-06,
207
+ "loss": 0.0013,
208
+ "step": 1625
209
+ },
210
+ {
211
+ "epoch": 13.0,
212
+ "eval_accuracy": 0.9196428571428571,
213
+ "eval_loss": 0.33594179153442383,
214
+ "eval_runtime": 11.2397,
215
+ "eval_samples_per_second": 29.894,
216
+ "eval_steps_per_second": 0.534,
217
+ "step": 1625
218
+ },
219
+ {
220
+ "epoch": 14.0,
221
+ "grad_norm": 0.02085023745894432,
222
+ "learning_rate": 2.5000000000000036e-06,
223
+ "loss": 0.001,
224
+ "step": 1750
225
+ },
226
+ {
227
+ "epoch": 14.0,
228
+ "eval_accuracy": 0.9226190476190477,
229
+ "eval_loss": 0.34129947423934937,
230
+ "eval_runtime": 11.0362,
231
+ "eval_samples_per_second": 30.445,
232
+ "eval_steps_per_second": 0.544,
233
+ "step": 1750
234
+ },
235
+ {
236
+ "epoch": 15.0,
237
+ "grad_norm": 0.028393927961587906,
238
+ "learning_rate": 3.015368960704584e-07,
239
+ "loss": 0.0009,
240
+ "step": 1875
241
+ },
242
+ {
243
+ "epoch": 15.0,
244
+ "eval_accuracy": 0.9226190476190477,
245
+ "eval_loss": 0.3424765169620514,
246
+ "eval_runtime": 10.9571,
247
+ "eval_samples_per_second": 30.665,
248
+ "eval_steps_per_second": 0.548,
249
+ "step": 1875
250
+ },
251
+ {
252
+ "epoch": 16.0,
253
+ "grad_norm": 0.018229400739073753,
254
+ "learning_rate": 9.698463103929542e-06,
255
+ "loss": 0.0009,
256
+ "step": 2000
257
+ },
258
+ {
259
+ "epoch": 16.0,
260
+ "eval_accuracy": 0.9226190476190477,
261
+ "eval_loss": 0.3481498956680298,
262
+ "eval_runtime": 11.0764,
263
+ "eval_samples_per_second": 30.335,
264
+ "eval_steps_per_second": 0.542,
265
+ "step": 2000
266
+ },
267
+ {
268
+ "epoch": 17.0,
269
+ "grad_norm": 0.018818996846675873,
270
+ "learning_rate": 7.499999999999999e-06,
271
+ "loss": 0.0007,
272
+ "step": 2125
273
+ },
274
+ {
275
+ "epoch": 17.0,
276
+ "eval_accuracy": 0.9226190476190477,
277
+ "eval_loss": 0.35712891817092896,
278
+ "eval_runtime": 10.3576,
279
+ "eval_samples_per_second": 32.44,
280
+ "eval_steps_per_second": 0.579,
281
+ "step": 2125
282
+ },
283
+ {
284
+ "epoch": 18.0,
285
+ "grad_norm": 0.021823769435286522,
286
+ "learning_rate": 4.131759111665352e-06,
287
+ "loss": 0.0006,
288
+ "step": 2250
289
+ },
290
+ {
291
+ "epoch": 18.0,
292
+ "eval_accuracy": 0.9196428571428571,
293
+ "eval_loss": 0.36197924613952637,
294
+ "eval_runtime": 11.0713,
295
+ "eval_samples_per_second": 30.349,
296
+ "eval_steps_per_second": 0.542,
297
+ "step": 2250
298
+ }
299
+ ],
300
  "logging_steps": 500,
301
+ "max_steps": 1875,
302
  "num_input_tokens_seen": 0,
303
+ "num_train_epochs": 15,
304
  "save_steps": 500,
305
  "stateful_callbacks": {
306
  "TrainerControl": {
 
308
  "should_epoch_stop": false,
309
  "should_evaluate": false,
310
  "should_log": false,
311
+ "should_save": true,
312
  "should_training_stop": false
313
  },
314
  "attributes": {}
315
  }
316
  },
317
+ "total_flos": 1.1159446583771136e+19,
318
  "train_batch_size": 64,
319
  "trial_name": null,
320
  "trial_params": null