Baselhany commited on
Commit
2bb6c9c
·
verified ·
1 Parent(s): 42eaa3a

Training in progress, step 35200, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:64a6ce10d6ee49594542cb9eaca3963c0482775bfd195eea607a3b736d78630a
3
  size 223144592
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:818a7679981fc0ec6b47bc6758933a6dc132a23ee5ac3054d56cc5a02cae3823
3
  size 223144592
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d185225ac64619e124c6d9a6588368052687171f0fd09697c97d959b8b7b8446
3
  size 281574266
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9e5378dfcfea31740c5b7fb988286fd4bf67acbbc58e4606cdc734ac572db2b
3
  size 281574266
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d87af18a0ac400d5d7de573010763f26b618db06bc838e54c97a8a6021751ee0
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1731ada7b53548acf7cfef80e6885ccc9e9454a0d4ede7ecdb3292b69f9b12c
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9da6023d3cd3bc79a91dfa184f82a453ac8795f05efb38449981d90d67cc96be
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3cf2f2f33b761e05038aa7a32c6a962768e656e6c0b0cd6ae9ff4e21de8efc51
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d3a13ff7879bb8d709a5e0a7153f659f171dd934fb7ae287fad4c641e9505c2a
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:869f259955307b28b00caecffc65d71770edc3cd19a8aba433aa1938286d15b5
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": 32400,
3
  "best_metric": 0.19510757441791923,
4
  "best_model_checkpoint": "./distil-whisper/checkpoint-32400",
5
- "epoch": 24.999821842152148,
6
  "eval_steps": 400,
7
- "global_step": 35075,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -3241,12 +3241,35 @@
3241
  "learning_rate": 2.74765003615329e-07,
3242
  "loss": 0.9673,
3243
  "step": 35000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3244
  }
3245
  ],
3246
  "logging_steps": 100,
3247
- "max_steps": 35075,
3248
  "num_input_tokens_seen": 0,
3249
- "num_train_epochs": 25,
3250
  "save_steps": 400,
3251
  "stateful_callbacks": {
3252
  "TrainerControl": {
@@ -3255,12 +3278,12 @@
3255
  "should_evaluate": false,
3256
  "should_log": false,
3257
  "should_save": true,
3258
- "should_training_stop": true
3259
  },
3260
  "attributes": {}
3261
  }
3262
  },
3263
- "total_flos": 4.560167779172352e+19,
3264
  "train_batch_size": 8,
3265
  "trial_name": null,
3266
  "trial_params": null
 
2
  "best_global_step": 32400,
3
  "best_metric": 0.19510757441791923,
4
  "best_model_checkpoint": "./distil-whisper/checkpoint-32400",
5
+ "epoch": 25.0890789239266,
6
  "eval_steps": 400,
7
+ "global_step": 35200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
3241
  "learning_rate": 2.74765003615329e-07,
3242
  "loss": 0.9673,
3243
  "step": 35000
3244
+ },
3245
+ {
3246
+ "epoch": 25.01781578478532,
3247
+ "grad_norm": 15.058631896972656,
3248
+ "learning_rate": 1.6855013224332772e-05,
3249
+ "loss": 0.9582,
3250
+ "step": 35100
3251
+ },
3252
+ {
3253
+ "epoch": 25.0890789239266,
3254
+ "grad_norm": 11.464241027832031,
3255
+ "learning_rate": 1.6614570810290935e-05,
3256
+ "loss": 1.0316,
3257
+ "step": 35200
3258
+ },
3259
+ {
3260
+ "epoch": 25.0890789239266,
3261
+ "eval_loss": 0.09259089827537537,
3262
+ "eval_runtime": 149.1152,
3263
+ "eval_samples_per_second": 3.353,
3264
+ "eval_steps_per_second": 0.422,
3265
+ "eval_wer": 0.19834954317712938,
3266
+ "step": 35200
3267
  }
3268
  ],
3269
  "logging_steps": 100,
3270
+ "max_steps": 42090,
3271
  "num_input_tokens_seen": 0,
3272
+ "num_train_epochs": 30,
3273
  "save_steps": 400,
3274
  "stateful_callbacks": {
3275
  "TrainerControl": {
 
3278
  "should_evaluate": false,
3279
  "should_log": false,
3280
  "should_save": true,
3281
+ "should_training_stop": false
3282
  },
3283
  "attributes": {}
3284
  }
3285
  },
3286
+ "total_flos": 4.576428047204352e+19,
3287
  "train_batch_size": 8,
3288
  "trial_name": null,
3289
  "trial_params": null
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bcc91c48d709e41f00ac682ba95a79e6330091c0de4c16618cd675c3045498dd
3
  size 5496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0927f54d878c4d2e9484c5d1a3a658a65404a12eac5670f7cfd2ede0ae057700
3
  size 5496