Baselhany commited on
Commit
87038cc
·
verified ·
1 Parent(s): dcc5cba

Training in progress, step 16870, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8daf519e56262574da44c0ef1b99ce20dfa6917108a4ca7ed2f9d533fdc8c1ba
3
  size 223144592
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a631f3737703c324c3c241adc703b24330e9f582b19bfd94e8d1e9b90cb7533
3
  size 223144592
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ce9deb2c7c7a8e25f17f3d650ec4d54d8887269d9c51b346d47fc9ace2e49db7
3
  size 281574266
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f809c5f2af7511f5e6d6bf53ef2df5bf6cf5684cf72732218d625f71df2ed0fc
3
  size 281574266
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ee6dca5678b882df81a5d39896646c925c7d4cb2a4c9671ace85732fa736c4f5
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7954d3f47cdc4e78510dd0477474838526e1a4a2a9e56890b6d3780e346e0928
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fc569727a87d5c1414231bcc21e5c78774f97c9039044a671a07f1c0b2ba722b
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e49f68b2e6549aea69b3c4898c5beed6fd5809222a695dedaa2327f1a9285410
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f0ec29cf1aa64cbf5f3ca0e7be0776f13fe78466f1761905213206b4277e5b76
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0717b2dd00cb179eefa3d5cab763c851639874f38293da9914ac4d2702108d48
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": 4000,
3
  "best_metric": 0.18950781019746538,
4
  "best_model_checkpoint": "./distil-whisper/checkpoint-4000",
5
- "epoch": 9.95850622406639,
6
  "eval_steps": 400,
7
- "global_step": 16800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -1576,12 +1576,12 @@
1576
  "should_evaluate": false,
1577
  "should_log": false,
1578
  "should_save": true,
1579
- "should_training_stop": false
1580
  },
1581
  "attributes": {}
1582
  }
1583
  },
1584
- "total_flos": 2.185123924279296e+19,
1585
  "train_batch_size": 8,
1586
  "trial_name": null,
1587
  "trial_params": null
 
2
  "best_global_step": 4000,
3
  "best_metric": 0.18950781019746538,
4
  "best_model_checkpoint": "./distil-whisper/checkpoint-4000",
5
+ "epoch": 10.0,
6
  "eval_steps": 400,
7
+ "global_step": 16870,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
1576
  "should_evaluate": false,
1577
  "should_log": false,
1578
  "should_save": true,
1579
+ "should_training_stop": true
1580
  },
1581
  "attributes": {}
1582
  }
1583
  },
1584
+ "total_flos": 2.19420121890816e+19,
1585
  "train_batch_size": 8,
1586
  "trial_name": null,
1587
  "trial_params": null