Baselhany committed on
Commit
44d26b5
·
verified ·
1 Parent(s): b561a4b

Training in progress, epoch 13, checkpoint

Browse files
last-checkpoint/generation_config.json CHANGED
@@ -65,20 +65,7 @@
65
  "1": "LABEL_1"
66
  },
67
  "init_std": 0.02,
68
- "input_ids": [
69
- [
70
- 1,
71
- 50272
72
- ],
73
- [
74
- 2,
75
- 50359
76
- ],
77
- [
78
- 3,
79
- 50363
80
- ]
81
- ],
82
  "is_decoder": false,
83
  "is_encoder_decoder": true,
84
  "is_multilingual": true,
 
65
  "1": "LABEL_1"
66
  },
67
  "init_std": 0.02,
68
+ "input_ids": null,
 
 
 
 
 
 
 
 
 
 
 
 
 
69
  "is_decoder": false,
70
  "is_encoder_decoder": true,
71
  "is_multilingual": true,
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fe05555510ebc55c4665edcb6454f5a98c203d73607b74b65485054a8f22985b
3
  size 223144592
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c11e59e81088d0e16b8735b6e597fec79f32d290e36d8def6b66cbbc9e8cd9a1
3
  size 223144592
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fd7cddb83bff0f688d9d17ae32e3307362f9136346d658e1851dc85b10499958
3
  size 281574266
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:104d77fcd199b8f340fb5fd3f8f129fe23300d5bc5c65964c445674c40b1ea3c
3
  size 281574266
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3750103d3d13774fbde9af71a1b620bee7b1f3fd3b4d85d56883589c78d71bd4
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e08d413e62216cbe63b70a91998470669d513dd371df2cba7b0ead107f19599
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:63f4c85a973f911d833e8fedb04651de698e4b737fa13407117e3027064f11ba
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7aefee4fd3e11c00d12d383dcb2394d9676c073e8b3c3644d024cad7798c0188
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9c6c3abe9ceb62539c5bc66c9459beb276c796c31f0262d8a4d34c48cc845a28
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b9874aa9a588ea803e346f0e1d9fe34891d4c784b3be0ae24270743f1766186
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": 4680,
3
  "best_metric": 0.2625994694960212,
4
  "best_model_checkpoint": "./distil-whisper/checkpoint-4680",
5
- "epoch": 14.9536,
6
  "eval_steps": 500,
7
- "global_step": 4680,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -465,12 +465,35 @@
465
  "eval_steps_per_second": 0.407,
466
  "eval_wer": 0.2625994694960212,
467
  "step": 4680
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
468
  }
469
  ],
470
  "logging_steps": 100,
471
- "max_steps": 4680,
472
  "num_input_tokens_seen": 0,
473
- "num_train_epochs": 15,
474
  "save_steps": 500,
475
  "stateful_callbacks": {
476
  "TrainerControl": {
@@ -479,12 +502,12 @@
479
  "should_evaluate": false,
480
  "should_log": false,
481
  "should_save": true,
482
- "should_training_stop": true
483
  },
484
  "attributes": {}
485
  }
486
  },
487
- "total_flos": 6.07873860108288e+18,
488
  "train_batch_size": 8,
489
  "trial_name": null,
490
  "trial_params": null
 
2
  "best_global_step": 4680,
3
  "best_metric": 0.2625994694960212,
4
  "best_model_checkpoint": "./distil-whisper/checkpoint-4680",
5
+ "epoch": 13.0,
6
  "eval_steps": 500,
7
+ "global_step": 4875,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
465
  "eval_steps_per_second": 0.407,
466
  "eval_wer": 0.2625994694960212,
467
  "step": 4680
468
+ },
469
+ {
470
+ "epoch": 12.533333333333333,
471
+ "grad_norm": 114.76351165771484,
472
+ "learning_rate": 4.021428571428572e-05,
473
+ "loss": 7.7843,
474
+ "step": 4700
475
+ },
476
+ {
477
+ "epoch": 12.8,
478
+ "grad_norm": 130.2476043701172,
479
+ "learning_rate": 3.8785714285714285e-05,
480
+ "loss": 7.0386,
481
+ "step": 4800
482
+ },
483
+ {
484
+ "epoch": 13.0,
485
+ "eval_loss": 0.12093591690063477,
486
+ "eval_runtime": 155.7693,
487
+ "eval_samples_per_second": 3.21,
488
+ "eval_steps_per_second": 0.404,
489
+ "eval_wer": 0.27600943118184496,
490
+ "step": 4875
491
  }
492
  ],
493
  "logging_steps": 100,
494
+ "max_steps": 7500,
495
  "num_input_tokens_seen": 0,
496
+ "num_train_epochs": 20,
497
  "save_steps": 500,
498
  "stateful_callbacks": {
499
  "TrainerControl": {
 
502
  "should_evaluate": false,
503
  "should_log": false,
504
  "should_save": true,
505
+ "should_training_stop": false
506
  },
507
  "attributes": {}
508
  }
509
  },
510
+ "total_flos": 6.33239878238208e+18,
511
  "train_batch_size": 8,
512
  "trial_name": null,
513
  "trial_params": null
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:800244257547555a23085083233b10cbaa528177ab8061d70f90dafa751bca41
3
- size 5496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02bfb31ca1639bb49b771e365c14935b1ca47589e808fb8789c196079d263aa1
3
+ size 5560