SodaXII committed on
Commit
00a5db7
·
verified ·
1 Parent(s): ba11535

Training in progress, epoch 1

Browse files
config.json CHANGED
@@ -48,6 +48,7 @@
48
  "out_indices": [
49
  4
50
  ],
 
51
  "stage_names": [
52
  "stem",
53
  "stage1",
 
48
  "out_indices": [
49
  4
50
  ],
51
+ "problem_type": "single_label_classification",
52
  "stage_names": [
53
  "stem",
54
  "stage1",
logs/events.out.tfevents.1740284504.a837d8c25e39.930.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8a20ef5f0d171bad8bc022f1b0428bfdec03b60be83da7ba58a80cf79fa5d52f
3
- size 88
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc76c8c2d41b07ebbb87412431c9d2f82ad6abbdecd844e27156fe31923be6b9
3
+ size 6263
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:839860602f3a191ee8ba132b71280186bb2246bff269f4c6b563f35969aaee8f
3
  size 94352152
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85767a6627f568c2d69712cc3bcd9a814fa125dc37b1607f764606474d7a7f0f
3
  size 94352152
trainer_state.json CHANGED
@@ -1,263 +1,13 @@
1
  {
2
- "best_metric": 0.8533294200897217,
3
- "best_model_checkpoint": "./drive/Shareddrives/CS198-Drones/training_output/resnet-50_rice-leaf-disease-augmented-v2_fft/checkpoint-1750",
4
- "epoch": 15.0,
5
  "eval_steps": 500,
6
- "global_step": 1875,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
- "log_history": [
11
- {
12
- "epoch": 1.0,
13
- "grad_norm": 1.1328648328781128,
14
- "learning_rate": 6.684491978609626e-06,
15
- "loss": 2.0458,
16
- "step": 125
17
- },
18
- {
19
- "epoch": 1.0,
20
- "eval_accuracy": 0.40773809523809523,
21
- "eval_loss": 1.9620426893234253,
22
- "eval_runtime": 13.3599,
23
- "eval_samples_per_second": 25.15,
24
- "eval_steps_per_second": 0.449,
25
- "step": 125
26
- },
27
- {
28
- "epoch": 2.0,
29
- "grad_norm": 1.9301390647888184,
30
- "learning_rate": 9.863149989091216e-06,
31
- "loss": 1.8522,
32
- "step": 250
33
- },
34
- {
35
- "epoch": 2.0,
36
- "eval_accuracy": 0.5297619047619048,
37
- "eval_loss": 1.7117981910705566,
38
- "eval_runtime": 13.4512,
39
- "eval_samples_per_second": 24.979,
40
- "eval_steps_per_second": 0.446,
41
- "step": 250
42
- },
43
- {
44
- "epoch": 3.0,
45
- "grad_norm": 2.323911666870117,
46
- "learning_rate": 8.824900028711128e-06,
47
- "loss": 1.6181,
48
- "step": 375
49
- },
50
- {
51
- "epoch": 3.0,
52
- "eval_accuracy": 0.5476190476190477,
53
- "eval_loss": 1.511465072631836,
54
- "eval_runtime": 13.4937,
55
- "eval_samples_per_second": 24.901,
56
- "eval_steps_per_second": 0.445,
57
- "step": 375
58
- },
59
- {
60
- "epoch": 4.0,
61
- "grad_norm": 2.650306463241577,
62
- "learning_rate": 6.973434279336284e-06,
63
- "loss": 1.4376,
64
- "step": 500
65
- },
66
- {
67
- "epoch": 4.0,
68
- "eval_accuracy": 0.6041666666666666,
69
- "eval_loss": 1.3706637620925903,
70
- "eval_runtime": 13.2381,
71
- "eval_samples_per_second": 25.381,
72
- "eval_steps_per_second": 0.453,
73
- "step": 500
74
- },
75
- {
76
- "epoch": 5.0,
77
- "grad_norm": 2.9543614387512207,
78
- "learning_rate": 4.7023947103966636e-06,
79
- "loss": 1.3093,
80
- "step": 625
81
- },
82
- {
83
- "epoch": 5.0,
84
- "eval_accuracy": 0.6220238095238095,
85
- "eval_loss": 1.2791615724563599,
86
- "eval_runtime": 13.3535,
87
- "eval_samples_per_second": 25.162,
88
- "eval_steps_per_second": 0.449,
89
- "step": 625
90
- },
91
- {
92
- "epoch": 6.0,
93
- "grad_norm": 2.6454391479492188,
94
- "learning_rate": 2.494629297272126e-06,
95
- "loss": 1.2299,
96
- "step": 750
97
- },
98
- {
99
- "epoch": 6.0,
100
- "eval_accuracy": 0.6369047619047619,
101
- "eval_loss": 1.2290029525756836,
102
- "eval_runtime": 13.6734,
103
- "eval_samples_per_second": 24.573,
104
- "eval_steps_per_second": 0.439,
105
- "step": 750
106
- },
107
- {
108
- "epoch": 7.0,
109
- "grad_norm": 3.4624359607696533,
110
- "learning_rate": 8.195332343135171e-07,
111
- "loss": 1.1881,
112
- "step": 875
113
- },
114
- {
115
- "epoch": 7.0,
116
- "eval_accuracy": 0.6398809523809523,
117
- "eval_loss": 1.2191029787063599,
118
- "eval_runtime": 13.6338,
119
- "eval_samples_per_second": 24.645,
120
- "eval_steps_per_second": 0.44,
121
- "step": 875
122
- },
123
- {
124
- "epoch": 8.0,
125
- "grad_norm": 3.2420051097869873,
126
- "learning_rate": 3.325035698205359e-08,
127
- "loss": 1.1751,
128
- "step": 1000
129
- },
130
- {
131
- "epoch": 8.0,
132
- "eval_accuracy": 0.6488095238095238,
133
- "eval_loss": 1.2101922035217285,
134
- "eval_runtime": 13.2305,
135
- "eval_samples_per_second": 25.396,
136
- "eval_steps_per_second": 0.453,
137
- "step": 1000
138
- },
139
- {
140
- "epoch": 9.0,
141
- "grad_norm": 3.5106637477874756,
142
- "learning_rate": 9.697046952264565e-06,
143
- "loss": 1.1347,
144
- "step": 1125
145
- },
146
- {
147
- "epoch": 9.0,
148
- "eval_accuracy": 0.6428571428571429,
149
- "eval_loss": 1.1266306638717651,
150
- "eval_runtime": 13.4879,
151
- "eval_samples_per_second": 24.911,
152
- "eval_steps_per_second": 0.445,
153
- "step": 1125
154
- },
155
- {
156
- "epoch": 10.0,
157
- "grad_norm": 4.020257472991943,
158
- "learning_rate": 8.428700450023544e-06,
159
- "loss": 1.0039,
160
- "step": 1250
161
- },
162
- {
163
- "epoch": 10.0,
164
- "eval_accuracy": 0.6726190476190477,
165
- "eval_loss": 1.0349254608154297,
166
- "eval_runtime": 13.2834,
167
- "eval_samples_per_second": 25.295,
168
- "eval_steps_per_second": 0.452,
169
- "step": 1250
170
- },
171
- {
172
- "epoch": 11.0,
173
- "grad_norm": 4.034997463226318,
174
- "learning_rate": 6.431374544200013e-06,
175
- "loss": 0.907,
176
- "step": 1375
177
- },
178
- {
179
- "epoch": 11.0,
180
- "eval_accuracy": 0.6934523809523809,
181
- "eval_loss": 0.9688853025436401,
182
- "eval_runtime": 13.1006,
183
- "eval_samples_per_second": 25.648,
184
- "eval_steps_per_second": 0.458,
185
- "step": 1375
186
- },
187
- {
188
- "epoch": 12.0,
189
- "grad_norm": 3.91182804107666,
190
- "learning_rate": 4.129722676764128e-06,
191
- "loss": 0.8387,
192
- "step": 1500
193
- },
194
- {
195
- "epoch": 12.0,
196
- "eval_accuracy": 0.6904761904761905,
197
- "eval_loss": 0.9262328147888184,
198
- "eval_runtime": 13.2928,
199
- "eval_samples_per_second": 25.277,
200
- "eval_steps_per_second": 0.451,
201
- "step": 1500
202
- },
203
- {
204
- "epoch": 13.0,
205
- "grad_norm": 3.1170542240142822,
206
- "learning_rate": 8.42870045002354e-06,
207
- "loss": 0.791,
208
- "step": 1625
209
- },
210
- {
211
- "epoch": 13.0,
212
- "eval_accuracy": 0.7142857142857143,
213
- "eval_loss": 0.8774951696395874,
214
- "eval_runtime": 13.2469,
215
- "eval_samples_per_second": 25.364,
216
- "eval_steps_per_second": 0.453,
217
- "step": 1625
218
- },
219
- {
220
- "epoch": 14.0,
221
- "grad_norm": 4.423528671264648,
222
- "learning_rate": 3.018018951921804e-06,
223
- "loss": 0.7244,
224
- "step": 1750
225
- },
226
- {
227
- "epoch": 14.0,
228
- "eval_accuracy": 0.7113095238095238,
229
- "eval_loss": 0.8533294200897217,
230
- "eval_runtime": 13.4659,
231
- "eval_samples_per_second": 24.952,
232
- "eval_steps_per_second": 0.446,
233
- "step": 1750
234
- },
235
- {
236
- "epoch": 15.0,
237
- "grad_norm": 4.605622291564941,
238
- "learning_rate": 0.0,
239
- "loss": 0.691,
240
- "step": 1875
241
- },
242
- {
243
- "epoch": 15.0,
244
- "eval_accuracy": 0.7202380952380952,
245
- "eval_loss": 0.8547136187553406,
246
- "eval_runtime": 15.5224,
247
- "eval_samples_per_second": 21.646,
248
- "eval_steps_per_second": 0.387,
249
- "step": 1875
250
- },
251
- {
252
- "epoch": 15.0,
253
- "step": 1875,
254
- "total_flos": 2.54958083702784e+18,
255
- "train_loss": 0.14709369303385417,
256
- "train_runtime": 1218.7812,
257
- "train_samples_per_second": 98.459,
258
- "train_steps_per_second": 1.538
259
- }
260
- ],
261
  "logging_steps": 500,
262
  "max_steps": 1875,
263
  "num_input_tokens_seen": 0,
@@ -269,13 +19,13 @@
269
  "should_epoch_stop": false,
270
  "should_evaluate": false,
271
  "should_log": false,
272
- "should_save": true,
273
- "should_training_stop": true
274
  },
275
  "attributes": {}
276
  }
277
  },
278
- "total_flos": 2.54958083702784e+18,
279
  "train_batch_size": 64,
280
  "trial_name": null,
281
  "trial_params": null
 
1
  {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 0,
5
  "eval_steps": 500,
6
+ "global_step": 0,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
+ "log_history": [],
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
11
  "logging_steps": 500,
12
  "max_steps": 1875,
13
  "num_input_tokens_seen": 0,
 
19
  "should_epoch_stop": false,
20
  "should_evaluate": false,
21
  "should_log": false,
22
+ "should_save": false,
23
+ "should_training_stop": false
24
  },
25
  "attributes": {}
26
  }
27
  },
28
+ "total_flos": 0,
29
  "train_batch_size": 64,
30
  "trial_name": null,
31
  "trial_params": null