Baselhany committed on
Commit
d36a099
·
verified ·
1 Parent(s): 7a58883

Training in progress, step 4400, checkpoint

Browse files
last-checkpoint/generation_config.json CHANGED
@@ -65,20 +65,7 @@
65
  "1": "LABEL_1"
66
  },
67
  "init_std": 0.02,
68
- "input_ids": [
69
- [
70
- 1,
71
- 50272
72
- ],
73
- [
74
- 2,
75
- 50359
76
- ],
77
- [
78
- 3,
79
- 50363
80
- ]
81
- ],
82
  "is_decoder": false,
83
  "is_encoder_decoder": true,
84
  "is_multilingual": true,
 
65
  "1": "LABEL_1"
66
  },
67
  "init_std": 0.02,
68
+ "input_ids": null,
 
 
 
 
 
 
 
 
 
 
 
 
 
69
  "is_decoder": false,
70
  "is_encoder_decoder": true,
71
  "is_multilingual": true,
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:69413f73615f83d9af3e012f915779e8feb55af85c0f9865e5b11ad6de4098a7
3
  size 223144592
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f40200e4b2d1a3f9598026f1d0cccc4f5b3103c0aadb8052e27f341f9a27838d
3
  size 223144592
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c26ab3bab0f78e1de1ae83243b84b339f9a73fdc9f36898bacd02627010b7e2f
3
  size 281574266
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90ed54e5fca7d5b720f092da54461547fac2b58c7298cca5427eb03096d37f9c
3
  size 281574266
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fffa34d617d37d160278a96263e54262610f7be0f6f6036d5ce9daab9c3384b4
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13153c51d9decd414ca15fdaaabc194d8395e3d59a60c4f1e9bfa5a3a8e7aa77
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:700c62e2c409fb74a77e8989f1568b7a1be716546579ac14b2d28333ee737550
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:527ed30c0082066de2b11ba3e383f402988390e42a94d94accb5601dac35d4d6
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0b18e7fa03b9a1836a4a0d45bc80a9a0024a1c8c3ed77ce70ed3080f8004f4c9
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c3512f84cd4c65eb0fe727a1e41ca960ab5dd56daf3156a40e9a12ed28a34d9
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": 4000,
3
  "best_metric": 0.22192749778956675,
4
  "best_model_checkpoint": "./distil-whisper/checkpoint-4000",
5
- "epoch": 2.998396579369321,
6
  "eval_steps": 400,
7
- "global_step": 4209,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -392,12 +392,35 @@
392
  "learning_rate": 6.470746832030197e-07,
393
  "loss": 4.095,
394
  "step": 4200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
395
  }
396
  ],
397
  "logging_steps": 100,
398
- "max_steps": 4209,
399
  "num_input_tokens_seen": 0,
400
- "num_train_epochs": 3,
401
  "save_steps": 400,
402
  "stateful_callbacks": {
403
  "TrainerControl": {
@@ -406,12 +429,12 @@
406
  "should_evaluate": false,
407
  "should_log": false,
408
  "should_save": true,
409
- "should_training_stop": true
410
  },
411
  "attributes": {}
412
  }
413
  },
414
- "total_flos": 5.4727997128704e+18,
415
  "train_batch_size": 8,
416
  "trial_name": null,
417
  "trial_params": null
 
2
  "best_global_step": 4000,
3
  "best_metric": 0.22192749778956675,
4
  "best_model_checkpoint": "./distil-whisper/checkpoint-4000",
5
+ "epoch": 3.136112595759843,
6
  "eval_steps": 400,
7
+ "global_step": 4400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
392
  "learning_rate": 6.470746832030197e-07,
393
  "loss": 4.095,
394
  "step": 4200
395
+ },
396
+ {
397
+ "epoch": 3.064849456618564,
398
+ "grad_norm": 75.29638671875,
399
+ "learning_rate": 7.202512934220252e-05,
400
+ "loss": 3.8662,
401
+ "step": 4300
402
+ },
403
+ {
404
+ "epoch": 3.136112595759843,
405
+ "grad_norm": 60.58271789550781,
406
+ "learning_rate": 7.12860310421286e-05,
407
+ "loss": 4.2814,
408
+ "step": 4400
409
+ },
410
+ {
411
+ "epoch": 3.136112595759843,
412
+ "eval_loss": 0.1134875938296318,
413
+ "eval_runtime": 150.6507,
414
+ "eval_samples_per_second": 3.319,
415
+ "eval_steps_per_second": 0.418,
416
+ "eval_wer": 0.23017978190391983,
417
+ "step": 4400
418
  }
419
  ],
420
  "logging_steps": 100,
421
+ "max_steps": 14030,
422
  "num_input_tokens_seen": 0,
423
+ "num_train_epochs": 10,
424
  "save_steps": 400,
425
  "stateful_callbacks": {
426
  "TrainerControl": {
 
429
  "should_evaluate": false,
430
  "should_log": false,
431
  "should_save": true,
432
+ "should_training_stop": false
433
  },
434
  "attributes": {}
435
  }
436
  },
437
+ "total_flos": 5.72125660839936e+18,
438
  "train_batch_size": 8,
439
  "trial_name": null,
440
  "trial_params": null
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:571d625a4025cbdd828f3e43d1e551c2865cdc3710a18660b39ca61e19f78063
3
- size 5496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2625b2ae202938153fb64f2a01d19411a432d88aa0bb47eeca4b758e05077415
3
+ size 5560