Yahiael1 committed on
Commit
326a39d
·
1 Parent(s): 94a84a2

Training in progress, step 15000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9dfae293f92d7ce42f799b1cfa3ff2324b449307ea5b1ffe909db5fdb43bc62e
3
  size 1115579397
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28187497dc6decd09c29c448cbe3c8f216a461b847b3dfe76c961eefcba760dd
3
  size 1115579397
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:53993b59de6e841bf87528e770e4f0d58566f5d261e3f8b554bc4ea54782393a
3
  size 557971229
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6cde4c8b5d264bfb9f8a06eee531d1d4753c6c5f780f672725d48cb200528c80
3
  size 557971229
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7350114a3b349562121e30f7b1c4e639541c40ef9b4afb3665041b3fdaa6980a
3
  size 15597
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21e8419e75fb4597ac6804eea271b8d8c7570e10eeb8b3dcf0e419dec78e3abc
3
  size 15597
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6dbc5097d3af03f81acfa53fb6f73f2a12d4ea9707e4a957c56edb34d729f7f1
3
  size 557
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4078cba31618fb628b6b959898b3af21da737bbca86995dd1501bc1bcdffba9e
3
  size 557
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7118ba55ae4b4d75ed6bdb199e80512c65f03c3b9ca20e7918b6fb4ec034c32d
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09b501e7cbbfd105661937636cf270aadedef3375bca9faacf1296b961e54ce2
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.1519631371796102,
5
- "global_step": 12000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -189,11 +189,47 @@
189
  "eval_samples_per_second": 7.655,
190
  "eval_steps_per_second": 0.383,
191
  "step": 12000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
192
  }
193
  ],
194
  "max_steps": 41668,
195
  "num_train_epochs": 4,
196
- "total_flos": 1.4630840437764096e+17,
197
  "trial_name": null,
198
  "trial_params": null
199
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.4399539214745127,
5
+ "global_step": 15000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
189
  "eval_samples_per_second": 7.655,
190
  "eval_steps_per_second": 0.383,
191
  "step": 12000
192
+ },
193
+ {
194
+ "epoch": 1.2,
195
+ "learning_rate": 0.0001400403187098013,
196
+ "loss": 1.8898,
197
+ "step": 12500
198
+ },
199
+ {
200
+ "epoch": 1.25,
201
+ "learning_rate": 0.00013764039550734377,
202
+ "loss": 1.8321,
203
+ "step": 13000
204
+ },
205
+ {
206
+ "epoch": 1.3,
207
+ "learning_rate": 0.00013524047230488627,
208
+ "loss": 1.8986,
209
+ "step": 13500
210
+ },
211
+ {
212
+ "epoch": 1.34,
213
+ "learning_rate": 0.00013284054910242874,
214
+ "loss": 1.8934,
215
+ "step": 14000
216
+ },
217
+ {
218
+ "epoch": 1.39,
219
+ "learning_rate": 0.0001304406258999712,
220
+ "loss": 1.873,
221
+ "step": 14500
222
+ },
223
+ {
224
+ "epoch": 1.44,
225
+ "learning_rate": 0.0001280407026975137,
226
+ "loss": 1.8582,
227
+ "step": 15000
228
  }
229
  ],
230
  "max_steps": 41668,
231
  "num_train_epochs": 4,
232
+ "total_flos": 1.8288586333495296e+17,
233
  "trial_name": null,
234
  "trial_params": null
235
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:53993b59de6e841bf87528e770e4f0d58566f5d261e3f8b554bc4ea54782393a
3
  size 557971229
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6cde4c8b5d264bfb9f8a06eee531d1d4753c6c5f780f672725d48cb200528c80
3
  size 557971229