dq158 committed on
Commit
894f5e2
·
1 Parent(s): ec3aaf6

Training in progress, epoch 10, checkpoint

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b71be19ad19a3a3e31959473f5c1a45cf3a994d2ac577b67dac440f4b30ca8e0
3
  size 2371770
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:095b3a1f6740c3523f4d618eb6e304dac8fadfe4f53deea6f89e7adff3341492
3
  size 2371770
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6223ce7959af515e2e82943538f39dc15a5eb2a27a686c90c211b2a33f14c087
3
  size 990409330
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1a76fa844f3a3191566c354079a7f4bc5694f5240c5233e76e250c0f6fce96d
3
  size 990409330
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a2f7b436e9bacdce8321c129258891cfe5297c358dd018f4af22a5983cb5b0d7
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:443ad106e89f5c225106f610ada6104a4bdb83f20e5790a9a64bb3871f9500ee
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:11944376c27fbea6ee7fff9906b50d8eeade72e136e82c5eaff059c29ff514f8
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ff0f9f47b6a148ea17a10b4a36afba9e6cfc279b51fe048a45e8fbccd92f97e
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 2.0042803287506104,
3
- "best_model_checkpoint": "dq158/coqui/checkpoint-8312",
4
- "epoch": 9.999398496240602,
5
  "eval_steps": 500,
6
- "global_step": 8312,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -293,13 +293,44 @@
293
  "eval_steps_per_second": 0.605,
294
  "eval_translation_length": 55997,
295
  "step": 8312
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
296
  }
297
  ],
298
  "logging_steps": 500,
299
  "max_steps": 16620,
300
  "num_train_epochs": 20,
301
  "save_steps": 500,
302
- "total_flos": 1.8213176060411904e+17,
303
  "trial_name": null,
304
  "trial_params": null
305
  }
 
1
  {
2
+ "best_metric": 2.0005455017089844,
3
+ "best_model_checkpoint": "dq158/coqui/checkpoint-9143",
4
+ "epoch": 10.999097744360903,
5
  "eval_steps": 500,
6
+ "global_step": 9143,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
293
  "eval_steps_per_second": 0.605,
294
  "eval_translation_length": 55997,
295
  "step": 8312
296
+ },
297
+ {
298
+ "epoch": 10.23,
299
+ "learning_rate": 4.552618528938031e-05,
300
+ "loss": 1.9494,
301
+ "step": 8500
302
+ },
303
+ {
304
+ "epoch": 10.83,
305
+ "learning_rate": 4.114594725207993e-05,
306
+ "loss": 1.9375,
307
+ "step": 9000
308
+ },
309
+ {
310
+ "epoch": 11.0,
311
+ "eval_bleu": 1.0,
312
+ "eval_brevity_penalty": 1.0,
313
+ "eval_length_ratio": 1.0,
314
+ "eval_loss": 2.0005455017089844,
315
+ "eval_precisions": [
316
+ 1.0,
317
+ 1.0,
318
+ 1.0,
319
+ 1.0
320
+ ],
321
+ "eval_reference_length": 56078,
322
+ "eval_runtime": 610.5262,
323
+ "eval_samples_per_second": 4.842,
324
+ "eval_steps_per_second": 0.606,
325
+ "eval_translation_length": 56078,
326
+ "step": 9143
327
  }
328
  ],
329
  "logging_steps": 500,
330
  "max_steps": 16620,
331
  "num_train_epochs": 20,
332
  "save_steps": 500,
333
+ "total_flos": 2.0034493666453094e+17,
334
  "trial_name": null,
335
  "trial_params": null
336
  }