aalonso-developer committed on
Commit
f2e57e2
·
1 Parent(s): f21b3d8

🍻 cheers

Browse files
all_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
- "epoch": 2.21,
3
- "eval_accuracy": 0.704446442154761,
4
- "eval_loss": 1.016680121421814,
5
- "eval_runtime": 152.7892,
6
- "eval_samples_per_second": 189.294,
7
- "eval_steps_per_second": 23.667,
8
- "train_loss": 0.965315860748291,
9
- "train_runtime": 7707.001,
10
- "train_samples_per_second": 150.108,
11
- "train_steps_per_second": 4.691
12
  }
 
1
  {
2
+ "epoch": 2.49,
3
+ "eval_accuracy": 0.7163750777954498,
4
+ "eval_loss": 0.9792525172233582,
5
+ "eval_runtime": 155.2753,
6
+ "eval_samples_per_second": 186.263,
7
+ "eval_steps_per_second": 23.288,
8
+ "train_loss": 0.9232679036458333,
9
+ "train_runtime": 8603.1753,
10
+ "train_samples_per_second": 134.472,
11
+ "train_steps_per_second": 4.203
12
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 2.21,
3
- "eval_accuracy": 0.704446442154761,
4
- "eval_loss": 1.016680121421814,
5
- "eval_runtime": 152.7892,
6
- "eval_samples_per_second": 189.294,
7
- "eval_steps_per_second": 23.667
8
  }
 
1
  {
2
+ "epoch": 2.49,
3
+ "eval_accuracy": 0.7163750777954498,
4
+ "eval_loss": 0.9792525172233582,
5
+ "eval_runtime": 155.2753,
6
+ "eval_samples_per_second": 186.263,
7
+ "eval_steps_per_second": 23.288
8
  }
runs/May28_21-20-54_adrian-development/events.out.tfevents.1685310471.adrian-development.89081.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e447789ec67dc46db5a3c4c34da1588a275dcfbb741973a9a3dc72541925923
3
+ size 369
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "epoch": 2.21,
3
- "train_loss": 0.965315860748291,
4
- "train_runtime": 7707.001,
5
- "train_samples_per_second": 150.108,
6
- "train_steps_per_second": 4.691
7
  }
 
1
  {
2
+ "epoch": 2.49,
3
+ "train_loss": 0.9232679036458333,
4
+ "train_runtime": 8603.1753,
5
+ "train_samples_per_second": 134.472,
6
+ "train_steps_per_second": 4.203
7
  }
trainer_state.json CHANGED
@@ -1,265 +1,295 @@
1
  {
2
- "best_metric": 1.016680121421814,
3
  "best_model_checkpoint": "Transformers/vit-base-clothing-leafs-example-full-simple/checkpoint-13000",
4
- "epoch": 2.212695339510441,
5
- "global_step": 16000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 0.14,
12
- "learning_rate": 9.723413082561195e-05,
13
- "loss": 1.5425,
14
  "step": 1000
15
  },
16
  {
17
  "epoch": 0.14,
18
- "eval_accuracy": 0.6361593250812531,
19
- "eval_loss": 1.2916964292526245,
20
- "eval_runtime": 156.1905,
21
- "eval_samples_per_second": 185.171,
22
- "eval_steps_per_second": 23.151,
23
  "step": 1000
24
  },
25
  {
26
  "epoch": 0.28,
27
- "learning_rate": 9.44682616512239e-05,
28
- "loss": 1.2,
29
  "step": 2000
30
  },
31
  {
32
  "epoch": 0.28,
33
- "eval_accuracy": 0.663439596155176,
34
- "eval_loss": 1.1727856397628784,
35
- "eval_runtime": 154.4853,
36
- "eval_samples_per_second": 187.215,
37
- "eval_steps_per_second": 23.407,
38
  "step": 2000
39
  },
40
  {
41
  "epoch": 0.41,
42
- "learning_rate": 9.170515834601023e-05,
43
- "loss": 1.1415,
44
  "step": 3000
45
  },
46
  {
47
  "epoch": 0.41,
48
- "eval_accuracy": 0.6729133531567665,
49
- "eval_loss": 1.1330761909484863,
50
- "eval_runtime": 154.2347,
51
- "eval_samples_per_second": 187.519,
52
- "eval_steps_per_second": 23.445,
53
  "step": 3000
54
  },
55
  {
56
  "epoch": 0.55,
57
- "learning_rate": 8.894205504079658e-05,
58
- "loss": 1.1054,
59
  "step": 4000
60
  },
61
  {
62
  "epoch": 0.55,
63
- "eval_accuracy": 0.68145356476039,
64
- "eval_loss": 1.092808723449707,
65
- "eval_runtime": 156.3316,
66
- "eval_samples_per_second": 185.004,
67
- "eval_steps_per_second": 23.13,
68
  "step": 4000
69
  },
70
  {
71
  "epoch": 0.69,
72
- "learning_rate": 8.617618586640852e-05,
73
- "loss": 1.0592,
74
  "step": 5000
75
  },
76
  {
77
  "epoch": 0.69,
78
- "eval_accuracy": 0.6865016250605076,
79
- "eval_loss": 1.0824187994003296,
80
- "eval_runtime": 155.4175,
81
- "eval_samples_per_second": 186.092,
82
- "eval_steps_per_second": 23.266,
83
  "step": 5000
84
  },
85
  {
86
  "epoch": 0.83,
87
- "learning_rate": 8.341031669202047e-05,
88
- "loss": 1.0516,
89
  "step": 6000
90
  },
91
  {
92
  "epoch": 0.83,
93
- "eval_accuracy": 0.6868128068598299,
94
- "eval_loss": 1.07091224193573,
95
- "eval_runtime": 153.8441,
96
- "eval_samples_per_second": 187.996,
97
- "eval_steps_per_second": 23.504,
98
  "step": 6000
99
  },
100
  {
101
  "epoch": 0.97,
102
- "learning_rate": 8.06499792559812e-05,
103
- "loss": 1.0335,
104
  "step": 7000
105
  },
106
  {
107
  "epoch": 0.97,
108
- "eval_accuracy": 0.6915496853606251,
109
- "eval_loss": 1.0542349815368652,
110
- "eval_runtime": 154.6828,
111
- "eval_samples_per_second": 186.976,
112
- "eval_steps_per_second": 23.377,
113
  "step": 7000
114
  },
115
  {
116
  "epoch": 1.11,
117
- "learning_rate": 7.788411008159315e-05,
118
- "loss": 0.9049,
119
  "step": 8000
120
  },
121
  {
122
  "epoch": 1.11,
123
- "eval_accuracy": 0.6960791093285388,
124
- "eval_loss": 1.0505256652832031,
125
- "eval_runtime": 154.9548,
126
- "eval_samples_per_second": 186.648,
127
- "eval_steps_per_second": 23.336,
128
  "step": 8000
129
  },
130
  {
131
  "epoch": 1.24,
132
- "learning_rate": 7.51182409072051e-05,
133
- "loss": 0.855,
134
  "step": 9000
135
  },
136
  {
137
  "epoch": 1.24,
138
- "eval_accuracy": 0.7003319272526105,
139
- "eval_loss": 1.0373600721359253,
140
- "eval_runtime": 153.7792,
141
- "eval_samples_per_second": 188.075,
142
- "eval_steps_per_second": 23.514,
143
  "step": 9000
144
  },
145
  {
146
  "epoch": 1.38,
147
- "learning_rate": 7.235237173281704e-05,
148
- "loss": 0.8416,
149
  "step": 10000
150
  },
151
  {
152
  "epoch": 1.38,
153
- "eval_accuracy": 0.6987760182559989,
154
- "eval_loss": 1.0450818538665771,
155
- "eval_runtime": 153.737,
156
- "eval_samples_per_second": 188.126,
157
- "eval_steps_per_second": 23.521,
158
  "step": 10000
159
  },
160
  {
161
  "epoch": 1.52,
162
- "learning_rate": 6.958650255842899e-05,
163
- "loss": 0.8389,
164
  "step": 11000
165
  },
166
  {
167
  "epoch": 1.52,
168
- "eval_accuracy": 0.7001936242306894,
169
- "eval_loss": 1.0445177555084229,
170
- "eval_runtime": 154.5258,
171
- "eval_samples_per_second": 187.166,
172
- "eval_steps_per_second": 23.401,
173
  "step": 11000
174
  },
175
  {
176
  "epoch": 1.66,
177
- "learning_rate": 6.682063338404095e-05,
178
- "loss": 0.8565,
179
  "step": 12000
180
  },
181
  {
182
  "epoch": 1.66,
183
- "eval_accuracy": 0.7031671392019916,
184
- "eval_loss": 1.0185155868530273,
185
- "eval_runtime": 155.9035,
186
- "eval_samples_per_second": 185.512,
187
- "eval_steps_per_second": 23.194,
188
  "step": 12000
189
  },
190
  {
191
  "epoch": 1.8,
192
- "learning_rate": 6.406029594800165e-05,
193
- "loss": 0.8621,
194
  "step": 13000
195
  },
196
  {
197
  "epoch": 1.8,
198
- "eval_accuracy": 0.704446442154761,
199
- "eval_loss": 1.016680121421814,
200
- "eval_runtime": 153.8181,
201
- "eval_samples_per_second": 188.027,
202
- "eval_steps_per_second": 23.508,
203
  "step": 13000
204
  },
205
  {
206
  "epoch": 1.94,
207
- "learning_rate": 6.129442677361361e-05,
208
- "loss": 0.8402,
209
  "step": 14000
210
  },
211
  {
212
  "epoch": 1.94,
213
- "eval_accuracy": 0.7033054422239126,
214
- "eval_loss": 1.0216416120529175,
215
- "eval_runtime": 155.4829,
216
- "eval_samples_per_second": 186.014,
217
- "eval_steps_per_second": 23.257,
218
  "step": 14000
219
  },
220
  {
221
  "epoch": 2.07,
222
- "learning_rate": 5.852855759922557e-05,
223
- "loss": 0.7132,
224
  "step": 15000
225
  },
226
  {
227
  "epoch": 2.07,
228
- "eval_accuracy": 0.7061752299287739,
229
- "eval_loss": 1.047763466835022,
230
- "eval_runtime": 154.3004,
231
- "eval_samples_per_second": 187.44,
232
- "eval_steps_per_second": 23.435,
233
  "step": 15000
234
  },
235
  {
236
  "epoch": 2.21,
237
- "learning_rate": 5.576268842483751e-05,
238
- "loss": 0.5989,
239
  "step": 16000
240
  },
241
  {
242
  "epoch": 2.21,
243
- "eval_accuracy": 0.7044810179102413,
244
- "eval_loss": 1.0767056941986084,
245
- "eval_runtime": 155.7802,
246
- "eval_samples_per_second": 185.659,
247
- "eval_steps_per_second": 23.212,
248
  "step": 16000
249
  },
250
  {
251
- "epoch": 2.21,
252
- "step": 16000,
253
- "total_flos": 3.968921951752827e+19,
254
- "train_loss": 0.965315860748291,
255
- "train_runtime": 7707.001,
256
- "train_samples_per_second": 150.108,
257
- "train_steps_per_second": 4.691
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
258
  }
259
  ],
260
  "max_steps": 36155,
261
  "num_train_epochs": 5,
262
- "total_flos": 3.968921951752827e+19,
263
  "trial_name": null,
264
  "trial_params": null
265
  }
 
1
  {
2
+ "best_metric": 0.9792525172233582,
3
  "best_model_checkpoint": "Transformers/vit-base-clothing-leafs-example-full-simple/checkpoint-13000",
4
+ "epoch": 2.489282256949246,
5
+ "global_step": 18000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 0.14,
12
+ "learning_rate": 4.8617065412805976e-05,
13
+ "loss": 1.7133,
14
  "step": 1000
15
  },
16
  {
17
  "epoch": 0.14,
18
+ "eval_accuracy": 0.6511306272042044,
19
+ "eval_loss": 1.298416018486023,
20
+ "eval_runtime": 153.5861,
21
+ "eval_samples_per_second": 188.311,
22
+ "eval_steps_per_second": 23.544,
23
  "step": 1000
24
  },
25
  {
26
  "epoch": 0.28,
27
+ "learning_rate": 4.723551376019915e-05,
28
+ "loss": 1.2132,
29
  "step": 2000
30
  },
31
  {
32
  "epoch": 0.28,
33
+ "eval_accuracy": 0.6832515040453634,
34
+ "eval_loss": 1.146278977394104,
35
+ "eval_runtime": 154.4414,
36
+ "eval_samples_per_second": 187.268,
37
+ "eval_steps_per_second": 23.413,
38
  "step": 2000
39
  },
40
  {
41
  "epoch": 0.41,
42
+ "learning_rate": 4.5853962107592315e-05,
43
+ "loss": 1.1346,
44
  "step": 3000
45
  },
46
  {
47
  "epoch": 0.41,
48
+ "eval_accuracy": 0.6904086854297766,
49
+ "eval_loss": 1.0889592170715332,
50
+ "eval_runtime": 155.3927,
51
+ "eval_samples_per_second": 186.122,
52
+ "eval_steps_per_second": 23.27,
53
  "step": 3000
54
  },
55
  {
56
  "epoch": 0.55,
57
+ "learning_rate": 4.447102752039829e-05,
58
+ "loss": 1.0888,
59
  "step": 4000
60
  },
61
  {
62
  "epoch": 0.55,
63
+ "eval_accuracy": 0.6949035336422101,
64
+ "eval_loss": 1.0718365907669067,
65
+ "eval_runtime": 154.1959,
66
+ "eval_samples_per_second": 187.567,
67
+ "eval_steps_per_second": 23.451,
68
  "step": 4000
69
  },
70
  {
71
  "epoch": 0.69,
72
+ "learning_rate": 4.308809293320426e-05,
73
+ "loss": 1.0576,
74
  "step": 5000
75
  },
76
  {
77
  "epoch": 0.69,
78
+ "eval_accuracy": 0.7007814120738538,
79
+ "eval_loss": 1.0322985649108887,
80
+ "eval_runtime": 156.7369,
81
+ "eval_samples_per_second": 184.526,
82
+ "eval_steps_per_second": 23.071,
83
  "step": 5000
84
  },
85
  {
86
  "epoch": 0.83,
87
+ "learning_rate": 4.170654128059743e-05,
88
+ "loss": 1.031,
89
  "step": 6000
90
  },
91
  {
92
  "epoch": 0.83,
93
+ "eval_accuracy": 0.7021644422930641,
94
+ "eval_loss": 1.0212959051132202,
95
+ "eval_runtime": 155.5747,
96
+ "eval_samples_per_second": 185.904,
97
+ "eval_steps_per_second": 23.243,
98
  "step": 6000
99
  },
100
  {
101
  "epoch": 0.97,
102
+ "learning_rate": 4.03236066934034e-05,
103
+ "loss": 1.0086,
104
  "step": 7000
105
  },
106
  {
107
  "epoch": 0.97,
108
+ "eval_accuracy": 0.700677684807413,
109
+ "eval_loss": 1.0171376466751099,
110
+ "eval_runtime": 156.0917,
111
+ "eval_samples_per_second": 185.289,
112
+ "eval_steps_per_second": 23.166,
113
  "step": 7000
114
  },
115
  {
116
  "epoch": 1.11,
117
+ "learning_rate": 3.894067210620938e-05,
118
+ "loss": 0.8678,
119
  "step": 8000
120
  },
121
  {
122
  "epoch": 1.11,
123
+ "eval_accuracy": 0.7091141691445958,
124
+ "eval_loss": 0.9995917081832886,
125
+ "eval_runtime": 156.6769,
126
+ "eval_samples_per_second": 184.596,
127
+ "eval_steps_per_second": 23.079,
128
  "step": 8000
129
  },
130
  {
131
  "epoch": 1.24,
132
+ "learning_rate": 3.755773751901535e-05,
133
+ "loss": 0.8331,
134
  "step": 9000
135
  },
136
  {
137
  "epoch": 1.24,
138
+ "eval_accuracy": 0.7084226540349907,
139
+ "eval_loss": 1.0052682161331177,
140
+ "eval_runtime": 156.5024,
141
+ "eval_samples_per_second": 184.802,
142
+ "eval_steps_per_second": 23.105,
143
  "step": 9000
144
  },
145
  {
146
  "epoch": 1.38,
147
+ "learning_rate": 3.617480293182133e-05,
148
+ "loss": 0.837,
149
  "step": 10000
150
  },
151
  {
152
  "epoch": 1.38,
153
+ "eval_accuracy": 0.7132286840467464,
154
+ "eval_loss": 0.9893946051597595,
155
+ "eval_runtime": 155.3223,
156
+ "eval_samples_per_second": 186.206,
157
+ "eval_steps_per_second": 23.281,
158
  "step": 10000
159
  },
160
  {
161
  "epoch": 1.52,
162
+ "learning_rate": 3.4793251279214494e-05,
163
+ "loss": 0.8405,
164
  "step": 11000
165
  },
166
  {
167
  "epoch": 1.52,
168
+ "eval_accuracy": 0.7134707143351082,
169
+ "eval_loss": 0.9912254810333252,
170
+ "eval_runtime": 155.9637,
171
+ "eval_samples_per_second": 185.441,
172
+ "eval_steps_per_second": 23.185,
173
  "step": 11000
174
  },
175
  {
176
  "epoch": 1.66,
177
+ "learning_rate": 3.341169962660766e-05,
178
+ "loss": 0.8273,
179
  "step": 12000
180
  },
181
  {
182
  "epoch": 1.66,
183
+ "eval_accuracy": 0.7159601687296867,
184
+ "eval_loss": 0.9918663501739502,
185
+ "eval_runtime": 155.3075,
186
+ "eval_samples_per_second": 186.224,
187
+ "eval_steps_per_second": 23.283,
188
  "step": 12000
189
  },
190
  {
191
  "epoch": 1.8,
192
+ "learning_rate": 3.202876503941364e-05,
193
+ "loss": 0.8371,
194
  "step": 13000
195
  },
196
  {
197
  "epoch": 1.8,
198
+ "eval_accuracy": 0.7163750777954498,
199
+ "eval_loss": 0.9792525172233582,
200
+ "eval_runtime": 155.0944,
201
+ "eval_samples_per_second": 186.48,
202
+ "eval_steps_per_second": 23.315,
203
  "step": 13000
204
  },
205
  {
206
  "epoch": 1.94,
207
+ "learning_rate": 3.064583045221961e-05,
208
+ "loss": 0.8225,
209
  "step": 14000
210
  },
211
  {
212
  "epoch": 1.94,
213
+ "eval_accuracy": 0.7162367747735288,
214
+ "eval_loss": 0.9806181788444519,
215
+ "eval_runtime": 155.9339,
216
+ "eval_samples_per_second": 185.476,
217
+ "eval_steps_per_second": 23.189,
218
  "step": 14000
219
  },
220
  {
221
  "epoch": 2.07,
222
+ "learning_rate": 2.9264278799612784e-05,
223
+ "loss": 0.7055,
224
  "step": 15000
225
  },
226
  {
227
  "epoch": 2.07,
228
+ "eval_accuracy": 0.7169628656386142,
229
+ "eval_loss": 1.0149892568588257,
230
+ "eval_runtime": 155.1376,
231
+ "eval_samples_per_second": 186.428,
232
+ "eval_steps_per_second": 23.308,
233
  "step": 15000
234
  },
235
  {
236
  "epoch": 2.21,
237
+ "learning_rate": 2.7881344212418754e-05,
238
+ "loss": 0.6012,
239
  "step": 16000
240
  },
241
  {
242
  "epoch": 2.21,
243
+ "eval_accuracy": 0.7123988659152203,
244
+ "eval_loss": 1.0372015237808228,
245
+ "eval_runtime": 155.042,
246
+ "eval_samples_per_second": 186.543,
247
+ "eval_steps_per_second": 23.323,
248
  "step": 16000
249
  },
250
  {
251
+ "epoch": 2.35,
252
+ "learning_rate": 2.649840962522473e-05,
253
+ "loss": 0.6035,
254
+ "step": 17000
255
+ },
256
+ {
257
+ "epoch": 2.35,
258
+ "eval_accuracy": 0.71236429015974,
259
+ "eval_loss": 1.0361833572387695,
260
+ "eval_runtime": 156.1808,
261
+ "eval_samples_per_second": 185.183,
262
+ "eval_steps_per_second": 23.153,
263
+ "step": 17000
264
+ },
265
+ {
266
+ "epoch": 2.49,
267
+ "learning_rate": 2.51154750380307e-05,
268
+ "loss": 0.596,
269
+ "step": 18000
270
+ },
271
+ {
272
+ "epoch": 2.49,
273
+ "eval_accuracy": 0.7120531083604177,
274
+ "eval_loss": 1.0460479259490967,
275
+ "eval_runtime": 157.7455,
276
+ "eval_samples_per_second": 183.346,
277
+ "eval_steps_per_second": 22.923,
278
+ "step": 18000
279
+ },
280
+ {
281
+ "epoch": 2.49,
282
+ "step": 18000,
283
+ "total_flos": 4.465066266677883e+19,
284
+ "train_loss": 0.9232679036458333,
285
+ "train_runtime": 8603.1753,
286
+ "train_samples_per_second": 134.472,
287
+ "train_steps_per_second": 4.203
288
  }
289
  ],
290
  "max_steps": 36155,
291
  "num_train_epochs": 5,
292
+ "total_flos": 4.465066266677883e+19,
293
  "trial_name": null,
294
  "trial_params": null
295
  }