dzinampini commited on
Commit
0c8d2d9
·
verified ·
1 Parent(s): 5d515a6

🍻 cheers

Browse files
README.md CHANGED
@@ -3,6 +3,7 @@ library_name: transformers
3
  license: apache-2.0
4
  base_model: google/vit-base-patch16-224-in21k
5
  tags:
 
6
  - generated_from_trainer
7
  metrics:
8
  - accuracy
@@ -19,13 +20,13 @@ should probably proofread and complete it, then remove this comment. -->
19
 
20
  # beans-leaf-disease-detection
21
 
22
- This model is a fine-tuned version of [google/vit-base-patch16-224-in21k](https://huggingface.co/google/vit-base-patch16-224-in21k) on an unknown dataset.
23
  It achieves the following results on the evaluation set:
24
- - Loss: 0.0472
25
- - Accuracy: 0.9850
26
- - Precision: 0.9856
27
- - Recall: 0.9850
28
- - F1: 0.9850
29
 
30
  ## Model description
31
 
 
3
  license: apache-2.0
4
  base_model: google/vit-base-patch16-224-in21k
5
  tags:
6
+ - image-classification
7
  - generated_from_trainer
8
  metrics:
9
  - accuracy
 
20
 
21
  # beans-leaf-disease-detection
22
 
23
+ This model is a fine-tuned version of [google/vit-base-patch16-224-in21k](https://huggingface.co/google/vit-base-patch16-224-in21k) on the beans dataset.
24
  It achieves the following results on the evaluation set:
25
+ - Loss: 0.0404
26
+ - Accuracy: 0.9925
27
+ - Precision: 0.9926
28
+ - Recall: 0.9925
29
+ - F1: 0.9925
30
 
31
  ## Model description
32
 
all_results.json CHANGED
@@ -1,16 +1,16 @@
1
  {
2
  "epoch": 4.0,
3
- "eval_accuracy": 1.0,
4
- "eval_f1": 1.0,
5
- "eval_loss": 0.014331846497952938,
6
- "eval_precision": 1.0,
7
- "eval_recall": 1.0,
8
- "eval_runtime": 3.7971,
9
- "eval_samples_per_second": 35.027,
10
- "eval_steps_per_second": 4.477,
11
  "total_flos": 3.205097416476426e+17,
12
- "train_loss": 0.11858639149711682,
13
- "train_runtime": 104.5608,
14
- "train_samples_per_second": 39.556,
15
- "train_steps_per_second": 2.487
16
  }
 
1
  {
2
  "epoch": 4.0,
3
+ "eval_accuracy": 0.9924812030075187,
4
+ "eval_f1": 0.9924802319630927,
5
+ "eval_loss": 0.04042869806289673,
6
+ "eval_precision": 0.9926482873851294,
7
+ "eval_recall": 0.9924812030075187,
8
+ "eval_runtime": 1.4609,
9
+ "eval_samples_per_second": 91.039,
10
+ "eval_steps_per_second": 11.637,
11
  "total_flos": 3.205097416476426e+17,
12
+ "train_loss": 0.04095530418249277,
13
+ "train_runtime": 294.0083,
14
+ "train_samples_per_second": 14.068,
15
+ "train_steps_per_second": 0.884
16
  }
eval_results.json CHANGED
@@ -1,11 +1,11 @@
1
  {
2
  "epoch": 4.0,
3
- "eval_accuracy": 1.0,
4
- "eval_f1": 1.0,
5
- "eval_loss": 0.014331846497952938,
6
- "eval_precision": 1.0,
7
- "eval_recall": 1.0,
8
- "eval_runtime": 3.7971,
9
- "eval_samples_per_second": 35.027,
10
- "eval_steps_per_second": 4.477
11
  }
 
1
  {
2
  "epoch": 4.0,
3
+ "eval_accuracy": 0.9924812030075187,
4
+ "eval_f1": 0.9924802319630927,
5
+ "eval_loss": 0.04042869806289673,
6
+ "eval_precision": 0.9926482873851294,
7
+ "eval_recall": 0.9924812030075187,
8
+ "eval_runtime": 1.4609,
9
+ "eval_samples_per_second": 91.039,
10
+ "eval_steps_per_second": 11.637
11
  }
runs/Apr08_12-13-15_8daea7f679cf/events.out.tfevents.1744114795.8daea7f679cf.15724.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7873338ee427a9cc0fb70bac41060bf2149b7af890a521615b19272e3efab3a6
3
+ size 560
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 4.0,
3
  "total_flos": 3.205097416476426e+17,
4
- "train_loss": 0.11858639149711682,
5
- "train_runtime": 104.5608,
6
- "train_samples_per_second": 39.556,
7
- "train_steps_per_second": 2.487
8
  }
 
1
  {
2
  "epoch": 4.0,
3
  "total_flos": 3.205097416476426e+17,
4
+ "train_loss": 0.04095530418249277,
5
+ "train_runtime": 294.0083,
6
+ "train_samples_per_second": 14.068,
7
+ "train_steps_per_second": 0.884
8
  }
trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_global_step": 200,
3
- "best_metric": 1.0,
4
  "best_model_checkpoint": "./vit-base-beans-model-finetuned/checkpoint-200",
5
  "epoch": 4.0,
6
- "eval_steps": 100,
7
  "global_step": 260,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
@@ -11,225 +11,261 @@
11
  "log_history": [
12
  {
13
  "epoch": 0.15384615384615385,
14
- "grad_norm": 1.2726824283599854,
15
  "learning_rate": 0.00019230769230769233,
16
- "loss": 0.7734,
17
  "step": 10
18
  },
19
  {
20
  "epoch": 0.3076923076923077,
21
- "grad_norm": 2.146637201309204,
22
  "learning_rate": 0.00018461538461538463,
23
- "loss": 0.2647,
24
  "step": 20
25
  },
26
  {
27
  "epoch": 0.46153846153846156,
28
- "grad_norm": 1.4233285188674927,
29
  "learning_rate": 0.00017692307692307693,
30
- "loss": 0.2683,
31
  "step": 30
32
  },
33
  {
34
  "epoch": 0.6153846153846154,
35
- "grad_norm": 0.6973394155502319,
36
  "learning_rate": 0.00016923076923076923,
37
- "loss": 0.282,
38
  "step": 40
39
  },
40
  {
41
  "epoch": 0.7692307692307693,
42
- "grad_norm": 0.30112147331237793,
43
  "learning_rate": 0.00016153846153846155,
44
- "loss": 0.1744,
 
 
 
 
 
 
 
 
 
 
 
 
45
  "step": 50
46
  },
47
  {
48
  "epoch": 0.9230769230769231,
49
- "grad_norm": 1.9841829538345337,
50
  "learning_rate": 0.00015384615384615385,
51
- "loss": 0.1775,
52
  "step": 60
53
  },
54
  {
55
  "epoch": 1.0769230769230769,
56
- "grad_norm": 0.2848643660545349,
57
  "learning_rate": 0.00014615384615384615,
58
- "loss": 0.2133,
59
  "step": 70
60
  },
61
  {
62
  "epoch": 1.2307692307692308,
63
- "grad_norm": 0.1492587774991989,
64
  "learning_rate": 0.00013846153846153847,
65
- "loss": 0.1077,
66
  "step": 80
67
  },
68
  {
69
  "epoch": 1.3846153846153846,
70
- "grad_norm": 0.22872798144817352,
71
  "learning_rate": 0.00013076923076923077,
72
- "loss": 0.0501,
73
  "step": 90
74
  },
75
  {
76
  "epoch": 1.5384615384615383,
77
- "grad_norm": 3.7855725288391113,
78
  "learning_rate": 0.0001230769230769231,
79
- "loss": 0.1638,
80
  "step": 100
81
  },
82
  {
83
  "epoch": 1.5384615384615383,
84
- "eval_accuracy": 0.9473684210526315,
85
- "eval_f1": 0.9468339901115093,
86
- "eval_loss": 0.14574794471263885,
87
- "eval_precision": 0.9514619883040936,
88
- "eval_recall": 0.9473684210526315,
89
- "eval_runtime": 2.8734,
90
- "eval_samples_per_second": 46.286,
91
- "eval_steps_per_second": 5.916,
92
  "step": 100
93
  },
94
  {
95
  "epoch": 1.6923076923076923,
96
- "grad_norm": 0.12178239226341248,
97
  "learning_rate": 0.00011538461538461538,
98
- "loss": 0.1062,
99
  "step": 110
100
  },
101
  {
102
  "epoch": 1.8461538461538463,
103
- "grad_norm": 0.16127511858940125,
104
  "learning_rate": 0.0001076923076923077,
105
- "loss": 0.082,
106
  "step": 120
107
  },
108
  {
109
  "epoch": 2.0,
110
- "grad_norm": 0.09819109737873077,
111
  "learning_rate": 0.0001,
112
- "loss": 0.107,
113
  "step": 130
114
  },
115
  {
116
  "epoch": 2.1538461538461537,
117
- "grad_norm": 6.641988754272461,
118
  "learning_rate": 9.230769230769232e-05,
119
- "loss": 0.0531,
120
  "step": 140
121
  },
122
  {
123
  "epoch": 2.3076923076923075,
124
- "grad_norm": 0.6329468488693237,
125
  "learning_rate": 8.461538461538461e-05,
126
- "loss": 0.0407,
 
 
 
 
 
 
 
 
 
 
 
 
127
  "step": 150
128
  },
129
  {
130
  "epoch": 2.4615384615384617,
131
- "grad_norm": 0.08334755897521973,
132
  "learning_rate": 7.692307692307693e-05,
133
- "loss": 0.0296,
134
  "step": 160
135
  },
136
  {
137
  "epoch": 2.6153846153846154,
138
- "grad_norm": 0.4335107207298279,
139
  "learning_rate": 6.923076923076924e-05,
140
- "loss": 0.0151,
141
  "step": 170
142
  },
143
  {
144
  "epoch": 2.769230769230769,
145
- "grad_norm": 0.07147972285747528,
146
  "learning_rate": 6.153846153846155e-05,
147
- "loss": 0.0445,
148
  "step": 180
149
  },
150
  {
151
  "epoch": 2.9230769230769234,
152
- "grad_norm": 1.928112268447876,
153
  "learning_rate": 5.384615384615385e-05,
154
- "loss": 0.0447,
155
  "step": 190
156
  },
157
  {
158
  "epoch": 3.076923076923077,
159
- "grad_norm": 0.06142687052488327,
160
  "learning_rate": 4.615384615384616e-05,
161
- "loss": 0.0156,
162
  "step": 200
163
  },
164
  {
165
  "epoch": 3.076923076923077,
166
- "eval_accuracy": 1.0,
167
- "eval_f1": 1.0,
168
- "eval_loss": 0.014331846497952938,
169
- "eval_precision": 1.0,
170
- "eval_recall": 1.0,
171
- "eval_runtime": 2.2915,
172
- "eval_samples_per_second": 58.041,
173
- "eval_steps_per_second": 7.419,
174
  "step": 200
175
  },
176
  {
177
  "epoch": 3.230769230769231,
178
- "grad_norm": 0.06270013004541397,
179
  "learning_rate": 3.846153846153846e-05,
180
- "loss": 0.0121,
181
  "step": 210
182
  },
183
  {
184
  "epoch": 3.3846153846153846,
185
- "grad_norm": 0.05996321141719818,
186
  "learning_rate": 3.0769230769230774e-05,
187
- "loss": 0.0129,
188
  "step": 220
189
  },
190
  {
191
  "epoch": 3.5384615384615383,
192
- "grad_norm": 0.06372592598199844,
193
  "learning_rate": 2.307692307692308e-05,
194
- "loss": 0.0112,
195
  "step": 230
196
  },
197
  {
198
  "epoch": 3.6923076923076925,
199
- "grad_norm": 0.055972643196582794,
200
  "learning_rate": 1.5384615384615387e-05,
201
- "loss": 0.0109,
202
  "step": 240
203
  },
204
  {
205
  "epoch": 3.8461538461538463,
206
- "grad_norm": 0.05908067896962166,
207
  "learning_rate": 7.692307692307694e-06,
208
- "loss": 0.011,
 
 
 
 
 
 
 
 
 
 
 
 
209
  "step": 250
210
  },
211
  {
212
  "epoch": 4.0,
213
- "grad_norm": 0.05994662642478943,
214
  "learning_rate": 0.0,
215
- "loss": 0.0112,
216
  "step": 260
217
  },
218
  {
219
  "epoch": 4.0,
220
  "step": 260,
221
  "total_flos": 3.205097416476426e+17,
222
- "train_loss": 0.11858639149711682,
223
- "train_runtime": 104.5608,
224
- "train_samples_per_second": 39.556,
225
- "train_steps_per_second": 2.487
226
  }
227
  ],
228
  "logging_steps": 10,
229
  "max_steps": 260,
230
  "num_input_tokens_seen": 0,
231
  "num_train_epochs": 4,
232
- "save_steps": 100,
233
  "stateful_callbacks": {
234
  "TrainerControl": {
235
  "args": {
 
1
  {
2
  "best_global_step": 200,
3
+ "best_metric": 0.9924812030075187,
4
  "best_model_checkpoint": "./vit-base-beans-model-finetuned/checkpoint-200",
5
  "epoch": 4.0,
6
+ "eval_steps": 50,
7
  "global_step": 260,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
 
11
  "log_history": [
12
  {
13
  "epoch": 0.15384615384615385,
14
+ "grad_norm": 0.046927113085985184,
15
  "learning_rate": 0.00019230769230769233,
16
+ "loss": 0.0203,
17
  "step": 10
18
  },
19
  {
20
  "epoch": 0.3076923076923077,
21
+ "grad_norm": 9.78127670288086,
22
  "learning_rate": 0.00018461538461538463,
23
+ "loss": 0.0936,
24
  "step": 20
25
  },
26
  {
27
  "epoch": 0.46153846153846156,
28
+ "grad_norm": 0.15273386240005493,
29
  "learning_rate": 0.00017692307692307693,
30
+ "loss": 0.1531,
31
  "step": 30
32
  },
33
  {
34
  "epoch": 0.6153846153846154,
35
+ "grad_norm": 0.059062909334897995,
36
  "learning_rate": 0.00016923076923076923,
37
+ "loss": 0.0808,
38
  "step": 40
39
  },
40
  {
41
  "epoch": 0.7692307692307693,
42
+ "grad_norm": 0.04636870697140694,
43
  "learning_rate": 0.00016153846153846155,
44
+ "loss": 0.0492,
45
+ "step": 50
46
+ },
47
+ {
48
+ "epoch": 0.7692307692307693,
49
+ "eval_accuracy": 0.9774436090225563,
50
+ "eval_f1": 0.9774379108058134,
51
+ "eval_loss": 0.1117313951253891,
52
+ "eval_precision": 0.9775956574956096,
53
+ "eval_recall": 0.9774436090225563,
54
+ "eval_runtime": 1.2431,
55
+ "eval_samples_per_second": 106.99,
56
+ "eval_steps_per_second": 13.675,
57
  "step": 50
58
  },
59
  {
60
  "epoch": 0.9230769230769231,
61
+ "grad_norm": 0.03537413850426674,
62
  "learning_rate": 0.00015384615384615385,
63
+ "loss": 0.1339,
64
  "step": 60
65
  },
66
  {
67
  "epoch": 1.0769230769230769,
68
+ "grad_norm": 8.806337356567383,
69
  "learning_rate": 0.00014615384615384615,
70
+ "loss": 0.0454,
71
  "step": 70
72
  },
73
  {
74
  "epoch": 1.2307692307692308,
75
+ "grad_norm": 10.037283897399902,
76
  "learning_rate": 0.00013846153846153847,
77
+ "loss": 0.0988,
78
  "step": 80
79
  },
80
  {
81
  "epoch": 1.3846153846153846,
82
+ "grad_norm": 0.030385395511984825,
83
  "learning_rate": 0.00013076923076923077,
84
+ "loss": 0.0539,
85
  "step": 90
86
  },
87
  {
88
  "epoch": 1.5384615384615383,
89
+ "grad_norm": 0.03275859355926514,
90
  "learning_rate": 0.0001230769230769231,
91
+ "loss": 0.0432,
92
  "step": 100
93
  },
94
  {
95
  "epoch": 1.5384615384615383,
96
+ "eval_accuracy": 0.9624060150375939,
97
+ "eval_f1": 0.9619558041418667,
98
+ "eval_loss": 0.14281876385211945,
99
+ "eval_precision": 0.9650282168005047,
100
+ "eval_recall": 0.9624060150375939,
101
+ "eval_runtime": 1.6279,
102
+ "eval_samples_per_second": 81.699,
103
+ "eval_steps_per_second": 10.443,
104
  "step": 100
105
  },
106
  {
107
  "epoch": 1.6923076923076923,
108
+ "grad_norm": 0.030820081010460854,
109
  "learning_rate": 0.00011538461538461538,
110
+ "loss": 0.0186,
111
  "step": 110
112
  },
113
  {
114
  "epoch": 1.8461538461538463,
115
+ "grad_norm": 0.027867253869771957,
116
  "learning_rate": 0.0001076923076923077,
117
+ "loss": 0.0827,
118
  "step": 120
119
  },
120
  {
121
  "epoch": 2.0,
122
+ "grad_norm": 0.03597959503531456,
123
  "learning_rate": 0.0001,
124
+ "loss": 0.0319,
125
  "step": 130
126
  },
127
  {
128
  "epoch": 2.1538461538461537,
129
+ "grad_norm": 0.12349524348974228,
130
  "learning_rate": 9.230769230769232e-05,
131
+ "loss": 0.0368,
132
  "step": 140
133
  },
134
  {
135
  "epoch": 2.3076923076923075,
136
+ "grad_norm": 0.3923969566822052,
137
  "learning_rate": 8.461538461538461e-05,
138
+ "loss": 0.0119,
139
+ "step": 150
140
+ },
141
+ {
142
+ "epoch": 2.3076923076923075,
143
+ "eval_accuracy": 0.9849624060150376,
144
+ "eval_f1": 0.9849605066094567,
145
+ "eval_loss": 0.07355950772762299,
146
+ "eval_precision": 0.9851258581235698,
147
+ "eval_recall": 0.9849624060150376,
148
+ "eval_runtime": 1.2553,
149
+ "eval_samples_per_second": 105.955,
150
+ "eval_steps_per_second": 13.543,
151
  "step": 150
152
  },
153
  {
154
  "epoch": 2.4615384615384617,
155
+ "grad_norm": 5.8568878173828125,
156
  "learning_rate": 7.692307692307693e-05,
157
+ "loss": 0.0635,
158
  "step": 160
159
  },
160
  {
161
  "epoch": 2.6153846153846154,
162
+ "grad_norm": 0.03230699151754379,
163
  "learning_rate": 6.923076923076924e-05,
164
+ "loss": 0.0067,
165
  "step": 170
166
  },
167
  {
168
  "epoch": 2.769230769230769,
169
+ "grad_norm": 0.02458355203270912,
170
  "learning_rate": 6.153846153846155e-05,
171
+ "loss": 0.0102,
172
  "step": 180
173
  },
174
  {
175
  "epoch": 2.9230769230769234,
176
+ "grad_norm": 0.017980379983782768,
177
  "learning_rate": 5.384615384615385e-05,
178
+ "loss": 0.0055,
179
  "step": 190
180
  },
181
  {
182
  "epoch": 3.076923076923077,
183
+ "grad_norm": 0.017595401033759117,
184
  "learning_rate": 4.615384615384616e-05,
185
+ "loss": 0.0038,
186
  "step": 200
187
  },
188
  {
189
  "epoch": 3.076923076923077,
190
+ "eval_accuracy": 0.9924812030075187,
191
+ "eval_f1": 0.9924802319630927,
192
+ "eval_loss": 0.04042869806289673,
193
+ "eval_precision": 0.9926482873851294,
194
+ "eval_recall": 0.9924812030075187,
195
+ "eval_runtime": 1.2785,
196
+ "eval_samples_per_second": 104.031,
197
+ "eval_steps_per_second": 13.297,
198
  "step": 200
199
  },
200
  {
201
  "epoch": 3.230769230769231,
202
+ "grad_norm": 0.016184426844120026,
203
  "learning_rate": 3.846153846153846e-05,
204
+ "loss": 0.0036,
205
  "step": 210
206
  },
207
  {
208
  "epoch": 3.3846153846153846,
209
+ "grad_norm": 0.016925645992159843,
210
  "learning_rate": 3.0769230769230774e-05,
211
+ "loss": 0.0037,
212
  "step": 220
213
  },
214
  {
215
  "epoch": 3.5384615384615383,
216
+ "grad_norm": 0.018014749512076378,
217
  "learning_rate": 2.307692307692308e-05,
218
+ "loss": 0.003,
219
  "step": 230
220
  },
221
  {
222
  "epoch": 3.6923076923076925,
223
+ "grad_norm": 0.016459761187434196,
224
  "learning_rate": 1.5384615384615387e-05,
225
+ "loss": 0.003,
226
  "step": 240
227
  },
228
  {
229
  "epoch": 3.8461538461538463,
230
+ "grad_norm": 0.015728654339909554,
231
  "learning_rate": 7.692307692307694e-06,
232
+ "loss": 0.0046,
233
+ "step": 250
234
+ },
235
+ {
236
+ "epoch": 3.8461538461538463,
237
+ "eval_accuracy": 0.9849624060150376,
238
+ "eval_f1": 0.9850440384831379,
239
+ "eval_loss": 0.04719630256295204,
240
+ "eval_precision": 0.9856162144491664,
241
+ "eval_recall": 0.9849624060150376,
242
+ "eval_runtime": 1.2361,
243
+ "eval_samples_per_second": 107.601,
244
+ "eval_steps_per_second": 13.753,
245
  "step": 250
246
  },
247
  {
248
  "epoch": 4.0,
249
+ "grad_norm": 0.015585985034704208,
250
  "learning_rate": 0.0,
251
+ "loss": 0.0029,
252
  "step": 260
253
  },
254
  {
255
  "epoch": 4.0,
256
  "step": 260,
257
  "total_flos": 3.205097416476426e+17,
258
+ "train_loss": 0.04095530418249277,
259
+ "train_runtime": 294.0083,
260
+ "train_samples_per_second": 14.068,
261
+ "train_steps_per_second": 0.884
262
  }
263
  ],
264
  "logging_steps": 10,
265
  "max_steps": 260,
266
  "num_input_tokens_seen": 0,
267
  "num_train_epochs": 4,
268
+ "save_steps": 50,
269
  "stateful_callbacks": {
270
  "TrainerControl": {
271
  "args": {