varcoder commited on
Commit
b7e7a49
·
verified ·
1 Parent(s): 22caa92

End of training

Browse files
README.md CHANGED
@@ -17,8 +17,8 @@ should probably proofread and complete it, then remove this comment. -->
17
 
18
  This model is a fine-tuned version of [microsoft/resnet-101](https://huggingface.co/microsoft/resnet-101) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
- - Loss: 0.3549
21
- - Accuracy: 0.8691
22
 
23
  ## Model description
24
 
 
17
 
18
  This model is a fine-tuned version of [microsoft/resnet-101](https://huggingface.co/microsoft/resnet-101) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
+ - Loss: 0.3590
21
+ - Accuracy: 0.8716
22
 
23
  ## Model description
24
 
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
- "epoch": 15.0,
3
- "eval_accuracy": 0.8568627450980392,
4
- "eval_loss": 0.3784649968147278,
5
- "eval_runtime": 25.0793,
6
- "eval_samples_per_second": 81.342,
7
- "eval_steps_per_second": 2.552,
8
- "total_flos": 4.700892636385505e+18,
9
- "train_loss": 0.7059793472290039,
10
- "train_runtime": 3152.3203,
11
- "train_samples_per_second": 38.824,
12
- "train_steps_per_second": 0.081
13
  }
 
1
  {
2
+ "epoch": 9.8,
3
+ "eval_accuracy": 0.8715686274509804,
4
+ "eval_loss": 0.3589998185634613,
5
+ "eval_runtime": 34.1863,
6
+ "eval_samples_per_second": 59.673,
7
+ "eval_steps_per_second": 1.872,
8
+ "total_flos": 7.501244449451129e+18,
9
+ "train_loss": 0.7515069055557251,
10
+ "train_runtime": 2638.4717,
11
+ "train_samples_per_second": 30.923,
12
+ "train_steps_per_second": 0.095
13
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 15.0,
3
- "eval_accuracy": 0.8568627450980392,
4
- "eval_loss": 0.3784649968147278,
5
- "eval_runtime": 25.0793,
6
- "eval_samples_per_second": 81.342,
7
- "eval_steps_per_second": 2.552
8
  }
 
1
  {
2
+ "epoch": 9.8,
3
+ "eval_accuracy": 0.8715686274509804,
4
+ "eval_loss": 0.3589998185634613,
5
+ "eval_runtime": 34.1863,
6
+ "eval_samples_per_second": 59.673,
7
+ "eval_steps_per_second": 1.872
8
  }
runs/Feb02_03-29-40_ae322b9c3506/events.out.tfevents.1706847275.ae322b9c3506.3394.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d4f149d568f278686d72523c6682cd0f8c8c5e5643377e506e196ea43949239
3
+ size 411
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 15.0,
3
- "total_flos": 4.700892636385505e+18,
4
- "train_loss": 0.7059793472290039,
5
- "train_runtime": 3152.3203,
6
- "train_samples_per_second": 38.824,
7
- "train_steps_per_second": 0.081
8
  }
 
1
  {
2
+ "epoch": 9.8,
3
+ "total_flos": 7.501244449451129e+18,
4
+ "train_loss": 0.7515069055557251,
5
+ "train_runtime": 2638.4717,
6
+ "train_samples_per_second": 30.923,
7
+ "train_steps_per_second": 0.095
8
  }
trainer_state.json CHANGED
@@ -1,265 +1,268 @@
1
  {
2
- "best_metric": 0.8568627450980392,
3
- "best_model_checkpoint": "resnet-101-finetuned-CivilEng11k/checkpoint-238",
4
- "epoch": 15.0,
5
  "eval_steps": 500,
6
- "global_step": 255,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.88,
13
- "learning_rate": 0.00017307692307692304,
14
- "loss": 2.6258,
15
- "step": 15
16
  },
17
  {
18
- "epoch": 1.0,
19
- "eval_accuracy": 0.5504901960784314,
20
- "eval_loss": 2.5047667026519775,
21
- "eval_runtime": 36.2965,
22
- "eval_samples_per_second": 56.204,
23
- "eval_steps_per_second": 1.763,
24
- "step": 17
25
  },
26
  {
27
- "epoch": 1.76,
28
- "learning_rate": 0.0002947598253275109,
29
- "loss": 2.2924,
 
 
 
 
 
 
 
 
 
30
  "step": 30
31
  },
 
 
 
 
 
 
 
 
 
 
 
 
32
  {
33
  "epoch": 2.0,
34
- "eval_accuracy": 0.5274509803921569,
35
- "eval_loss": 1.4727771282196045,
36
- "eval_runtime": 37.3662,
37
- "eval_samples_per_second": 54.595,
38
- "eval_steps_per_second": 1.713,
39
- "step": 34
40
- },
41
- {
42
- "epoch": 2.65,
43
- "learning_rate": 0.00027510917030567684,
44
- "loss": 1.452,
45
- "step": 45
46
- },
47
- {
48
- "epoch": 3.0,
49
- "eval_accuracy": 0.6950980392156862,
50
- "eval_loss": 1.0708895921707153,
51
- "eval_runtime": 36.9842,
52
- "eval_samples_per_second": 55.159,
53
- "eval_steps_per_second": 1.73,
54
  "step": 51
55
  },
56
  {
57
- "epoch": 3.53,
58
- "learning_rate": 0.0002554585152838428,
59
- "loss": 1.0363,
60
  "step": 60
61
  },
62
  {
63
- "epoch": 4.0,
64
- "eval_accuracy": 0.7710784313725491,
65
- "eval_loss": 0.6555339694023132,
66
- "eval_runtime": 36.72,
67
- "eval_samples_per_second": 55.556,
68
- "eval_steps_per_second": 1.743,
69
- "step": 68
70
  },
71
  {
72
- "epoch": 4.41,
73
- "learning_rate": 0.0002358078602620087,
74
- "loss": 0.7086,
75
- "step": 75
 
 
 
76
  },
77
  {
78
- "epoch": 5.0,
79
- "eval_accuracy": 0.8122549019607843,
80
- "eval_loss": 0.4875487685203552,
81
- "eval_runtime": 37.4307,
82
- "eval_samples_per_second": 54.501,
83
- "eval_steps_per_second": 1.71,
84
- "step": 85
85
  },
86
  {
87
- "epoch": 5.29,
88
- "learning_rate": 0.00021615720524017465,
89
- "loss": 0.5185,
90
  "step": 90
91
  },
92
  {
93
- "epoch": 6.0,
94
- "eval_accuracy": 0.8357843137254902,
95
- "eval_loss": 0.43364840745925903,
96
- "eval_runtime": 37.5452,
97
- "eval_samples_per_second": 54.334,
98
- "eval_steps_per_second": 1.705,
99
- "step": 102
100
  },
101
  {
102
- "epoch": 6.18,
103
- "learning_rate": 0.00019650655021834058,
104
- "loss": 0.4238,
105
- "step": 105
 
 
 
106
  },
107
  {
108
- "epoch": 7.0,
109
- "eval_accuracy": 0.8509803921568627,
110
- "eval_loss": 0.3962140381336212,
111
- "eval_runtime": 39.9756,
112
- "eval_samples_per_second": 51.031,
113
- "eval_steps_per_second": 1.601,
114
- "step": 119
115
  },
116
  {
117
- "epoch": 7.06,
118
- "learning_rate": 0.00017685589519650654,
119
- "loss": 0.3846,
120
  "step": 120
121
  },
122
  {
123
- "epoch": 7.94,
124
- "learning_rate": 0.00015720524017467246,
125
- "loss": 0.3436,
126
- "step": 135
 
 
 
127
  },
128
  {
129
- "epoch": 8.0,
130
- "eval_accuracy": 0.8514705882352941,
131
- "eval_loss": 0.3823707103729248,
132
- "eval_runtime": 40.0175,
133
- "eval_samples_per_second": 50.978,
134
- "eval_steps_per_second": 1.599,
135
- "step": 136
 
 
 
136
  },
137
  {
138
- "epoch": 8.82,
139
- "learning_rate": 0.00013755458515283842,
140
- "loss": 0.3185,
141
  "step": 150
142
  },
143
  {
144
- "epoch": 9.0,
145
- "eval_accuracy": 0.8514705882352941,
146
- "eval_loss": 0.38265544176101685,
147
- "eval_runtime": 39.6707,
148
- "eval_samples_per_second": 51.423,
149
- "eval_steps_per_second": 1.613,
150
  "step": 153
151
  },
152
  {
153
- "epoch": 9.71,
154
- "learning_rate": 0.00011790393013100435,
155
- "loss": 0.3116,
156
- "step": 165
157
  },
158
  {
159
- "epoch": 10.0,
160
- "eval_accuracy": 0.8534313725490196,
161
- "eval_loss": 0.37894687056541443,
162
- "eval_runtime": 38.7692,
163
- "eval_samples_per_second": 52.619,
164
- "eval_steps_per_second": 1.651,
165
  "step": 170
166
  },
167
  {
168
- "epoch": 10.59,
169
- "learning_rate": 9.825327510917029e-05,
170
- "loss": 0.2983,
 
 
 
 
 
 
 
 
 
171
  "step": 180
172
  },
173
  {
174
- "epoch": 11.0,
175
- "eval_accuracy": 0.8558823529411764,
176
- "eval_loss": 0.3759206235408783,
177
- "eval_runtime": 38.4006,
178
- "eval_samples_per_second": 53.124,
179
- "eval_steps_per_second": 1.667,
180
- "step": 187
181
  },
182
  {
183
- "epoch": 11.47,
184
- "learning_rate": 7.860262008733623e-05,
185
- "loss": 0.2703,
186
- "step": 195
187
  },
188
  {
189
- "epoch": 12.0,
190
- "eval_accuracy": 0.8480392156862745,
191
- "eval_loss": 0.3838962912559509,
192
- "eval_runtime": 38.2843,
193
- "eval_samples_per_second": 53.286,
194
- "eval_steps_per_second": 1.672,
195
  "step": 204
196
  },
197
  {
198
- "epoch": 12.35,
199
- "learning_rate": 5.8951965065502174e-05,
200
- "loss": 0.2618,
201
  "step": 210
202
  },
203
  {
204
- "epoch": 13.0,
205
- "eval_accuracy": 0.8539215686274509,
206
- "eval_loss": 0.38307902216911316,
207
- "eval_runtime": 38.0757,
208
- "eval_samples_per_second": 53.577,
209
- "eval_steps_per_second": 1.681,
210
- "step": 221
211
  },
212
  {
213
- "epoch": 13.24,
214
- "learning_rate": 3.9301310043668116e-05,
215
- "loss": 0.2613,
216
- "step": 225
 
 
 
217
  },
218
  {
219
- "epoch": 14.0,
220
- "eval_accuracy": 0.8568627450980392,
221
- "eval_loss": 0.3784649968147278,
222
- "eval_runtime": 38.1613,
223
- "eval_samples_per_second": 53.457,
224
- "eval_steps_per_second": 1.677,
225
- "step": 238
226
  },
227
  {
228
- "epoch": 14.12,
229
- "learning_rate": 1.9650655021834058e-05,
230
- "loss": 0.2514,
231
  "step": 240
232
  },
233
  {
234
- "epoch": 15.0,
235
  "learning_rate": 0.0,
236
- "loss": 0.2428,
237
- "step": 255
238
- },
239
- {
240
- "epoch": 15.0,
241
- "eval_accuracy": 0.8470588235294118,
242
- "eval_loss": 0.39441215991973877,
243
- "eval_runtime": 38.4101,
244
- "eval_samples_per_second": 53.111,
245
- "eval_steps_per_second": 1.666,
246
- "step": 255
247
- },
248
- {
249
- "epoch": 15.0,
250
- "step": 255,
251
- "total_flos": 4.700892636385505e+18,
252
- "train_loss": 0.7059793472290039,
253
- "train_runtime": 3152.3203,
254
- "train_samples_per_second": 38.824,
255
- "train_steps_per_second": 0.081
256
  }
257
  ],
258
- "logging_steps": 15,
259
- "max_steps": 255,
260
- "num_train_epochs": 15,
261
  "save_steps": 500,
262
- "total_flos": 4.700892636385505e+18,
263
  "trial_name": null,
264
  "trial_params": null
265
  }
 
1
  {
2
+ "best_metric": 0.8715686274509804,
3
+ "best_model_checkpoint": "resnet-101-finetuned-CivilEng11k/checkpoint-204",
4
+ "epoch": 9.803921568627452,
5
  "eval_steps": 500,
6
+ "global_step": 250,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.39,
13
+ "learning_rate": 0.00011999999999999999,
14
+ "loss": 2.6064,
15
+ "step": 10
16
  },
17
  {
18
+ "epoch": 0.78,
19
+ "learning_rate": 0.00023999999999999998,
20
+ "loss": 2.4679,
21
+ "step": 20
 
 
 
22
  },
23
  {
24
+ "epoch": 0.98,
25
+ "eval_accuracy": 0.5367647058823529,
26
+ "eval_loss": 1.9448940753936768,
27
+ "eval_runtime": 41.2734,
28
+ "eval_samples_per_second": 49.426,
29
+ "eval_steps_per_second": 1.551,
30
+ "step": 25
31
+ },
32
+ {
33
+ "epoch": 1.18,
34
+ "learning_rate": 0.00029333333333333327,
35
+ "loss": 1.9417,
36
  "step": 30
37
  },
38
+ {
39
+ "epoch": 1.57,
40
+ "learning_rate": 0.00028,
41
+ "loss": 1.3729,
42
+ "step": 40
43
+ },
44
+ {
45
+ "epoch": 1.96,
46
+ "learning_rate": 0.0002666666666666666,
47
+ "loss": 1.2247,
48
+ "step": 50
49
+ },
50
  {
51
  "epoch": 2.0,
52
+ "eval_accuracy": 0.6799019607843138,
53
+ "eval_loss": 1.1000670194625854,
54
+ "eval_runtime": 42.9676,
55
+ "eval_samples_per_second": 47.478,
56
+ "eval_steps_per_second": 1.489,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
57
  "step": 51
58
  },
59
  {
60
+ "epoch": 2.35,
61
+ "learning_rate": 0.00025333333333333333,
62
+ "loss": 1.062,
63
  "step": 60
64
  },
65
  {
66
+ "epoch": 2.75,
67
+ "learning_rate": 0.00023999999999999998,
68
+ "loss": 0.8434,
69
+ "step": 70
 
 
 
70
  },
71
  {
72
+ "epoch": 2.98,
73
+ "eval_accuracy": 0.7887254901960784,
74
+ "eval_loss": 0.5851422548294067,
75
+ "eval_runtime": 40.7115,
76
+ "eval_samples_per_second": 50.109,
77
+ "eval_steps_per_second": 1.572,
78
+ "step": 76
79
  },
80
  {
81
+ "epoch": 3.14,
82
+ "learning_rate": 0.00022666666666666663,
83
+ "loss": 0.6665,
84
+ "step": 80
 
 
 
85
  },
86
  {
87
+ "epoch": 3.53,
88
+ "learning_rate": 0.00021333333333333333,
89
+ "loss": 0.5464,
90
  "step": 90
91
  },
92
  {
93
+ "epoch": 3.92,
94
+ "learning_rate": 0.00019999999999999998,
95
+ "loss": 0.491,
96
+ "step": 100
 
 
 
97
  },
98
  {
99
+ "epoch": 4.0,
100
+ "eval_accuracy": 0.8338235294117647,
101
+ "eval_loss": 0.43349361419677734,
102
+ "eval_runtime": 41.9829,
103
+ "eval_samples_per_second": 48.591,
104
+ "eval_steps_per_second": 1.524,
105
+ "step": 102
106
  },
107
  {
108
+ "epoch": 4.31,
109
+ "learning_rate": 0.00018666666666666666,
110
+ "loss": 0.4475,
111
+ "step": 110
 
 
 
112
  },
113
  {
114
+ "epoch": 4.71,
115
+ "learning_rate": 0.0001733333333333333,
116
+ "loss": 0.4512,
117
  "step": 120
118
  },
119
  {
120
+ "epoch": 4.98,
121
+ "eval_accuracy": 0.8401960784313726,
122
+ "eval_loss": 0.40097689628601074,
123
+ "eval_runtime": 40.6062,
124
+ "eval_samples_per_second": 50.239,
125
+ "eval_steps_per_second": 1.576,
126
+ "step": 127
127
  },
128
  {
129
+ "epoch": 5.1,
130
+ "learning_rate": 0.00015999999999999999,
131
+ "loss": 0.4392,
132
+ "step": 130
133
+ },
134
+ {
135
+ "epoch": 5.49,
136
+ "learning_rate": 0.00014666666666666664,
137
+ "loss": 0.4147,
138
+ "step": 140
139
  },
140
  {
141
+ "epoch": 5.88,
142
+ "learning_rate": 0.0001333333333333333,
143
+ "loss": 0.3891,
144
  "step": 150
145
  },
146
  {
147
+ "epoch": 6.0,
148
+ "eval_accuracy": 0.8544117647058823,
149
+ "eval_loss": 0.38171347975730896,
150
+ "eval_runtime": 43.7502,
151
+ "eval_samples_per_second": 46.628,
152
+ "eval_steps_per_second": 1.463,
153
  "step": 153
154
  },
155
  {
156
+ "epoch": 6.27,
157
+ "learning_rate": 0.00011999999999999999,
158
+ "loss": 0.3902,
159
+ "step": 160
160
  },
161
  {
162
+ "epoch": 6.67,
163
+ "learning_rate": 0.00010666666666666667,
164
+ "loss": 0.3533,
 
 
 
165
  "step": 170
166
  },
167
  {
168
+ "epoch": 6.98,
169
+ "eval_accuracy": 0.8602941176470589,
170
+ "eval_loss": 0.3679962158203125,
171
+ "eval_runtime": 38.6694,
172
+ "eval_samples_per_second": 52.755,
173
+ "eval_steps_per_second": 1.655,
174
+ "step": 178
175
+ },
176
+ {
177
+ "epoch": 7.06,
178
+ "learning_rate": 9.333333333333333e-05,
179
+ "loss": 0.3553,
180
  "step": 180
181
  },
182
  {
183
+ "epoch": 7.45,
184
+ "learning_rate": 7.999999999999999e-05,
185
+ "loss": 0.352,
186
+ "step": 190
 
 
 
187
  },
188
  {
189
+ "epoch": 7.84,
190
+ "learning_rate": 6.666666666666666e-05,
191
+ "loss": 0.3407,
192
+ "step": 200
193
  },
194
  {
195
+ "epoch": 8.0,
196
+ "eval_accuracy": 0.8715686274509804,
197
+ "eval_loss": 0.3589998185634613,
198
+ "eval_runtime": 31.761,
199
+ "eval_samples_per_second": 64.23,
200
+ "eval_steps_per_second": 2.015,
201
  "step": 204
202
  },
203
  {
204
+ "epoch": 8.24,
205
+ "learning_rate": 5.333333333333333e-05,
206
+ "loss": 0.351,
207
  "step": 210
208
  },
209
  {
210
+ "epoch": 8.63,
211
+ "learning_rate": 3.9999999999999996e-05,
212
+ "loss": 0.3244,
213
+ "step": 220
 
 
 
214
  },
215
  {
216
+ "epoch": 8.98,
217
+ "eval_accuracy": 0.8661764705882353,
218
+ "eval_loss": 0.36056193709373474,
219
+ "eval_runtime": 34.9574,
220
+ "eval_samples_per_second": 58.357,
221
+ "eval_steps_per_second": 1.831,
222
+ "step": 229
223
  },
224
  {
225
+ "epoch": 9.02,
226
+ "learning_rate": 2.6666666666666667e-05,
227
+ "loss": 0.3148,
228
+ "step": 230
 
 
 
229
  },
230
  {
231
+ "epoch": 9.41,
232
+ "learning_rate": 1.3333333333333333e-05,
233
+ "loss": 0.3156,
234
  "step": 240
235
  },
236
  {
237
+ "epoch": 9.8,
238
  "learning_rate": 0.0,
239
+ "loss": 0.3258,
240
+ "step": 250
241
+ },
242
+ {
243
+ "epoch": 9.8,
244
+ "eval_accuracy": 0.8691176470588236,
245
+ "eval_loss": 0.3549394905567169,
246
+ "eval_runtime": 38.198,
247
+ "eval_samples_per_second": 53.406,
248
+ "eval_steps_per_second": 1.675,
249
+ "step": 250
250
+ },
251
+ {
252
+ "epoch": 9.8,
253
+ "step": 250,
254
+ "total_flos": 7.501244449451129e+18,
255
+ "train_loss": 0.7515069055557251,
256
+ "train_runtime": 2638.4717,
257
+ "train_samples_per_second": 30.923,
258
+ "train_steps_per_second": 0.095
259
  }
260
  ],
261
+ "logging_steps": 10,
262
+ "max_steps": 250,
263
+ "num_train_epochs": 10,
264
  "save_steps": 500,
265
+ "total_flos": 7.501244449451129e+18,
266
  "trial_name": null,
267
  "trial_params": null
268
  }