Training in progress, step 45000, checkpoint

Browse files

Files changed (7) hide show

last-checkpoint/model.safetensors +1 -1
last-checkpoint/optimizer.pt +1 -1
last-checkpoint/rng_state.pth +1 -1
last-checkpoint/scaler.pt +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +64 -6
last-checkpoint/training_args.bin +1 -1

last-checkpoint/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:536dba7fc2640bfa4ad663dd452c5d567e8c167eb10a63cd22ec31f811f18e52
 size 223144592

 version https://git-lfs.github.com/spec/v1
+oid sha256:a568e96942cd89d7314e0d976df15beb19a7b31b7a80ad573473c86d1302e93c
 size 223144592

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d19b0dcd9da6f13cd9ad0dd993bfc687a2bdf56f7e214d88c765818897bab823
 size 281574266

 version https://git-lfs.github.com/spec/v1
+oid sha256:567de69fd0ba1c4c7a9a8ffc136ab6ca0803415a38b7fe06415d067f7858636e
 size 281574266

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d5935b0f811da736a5e0dd5d8910bf0435f820e6988c2171722e97cd03bc81ff
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:1b8b7531b1fc5b902cb75ca7a9dbdcd9897897bf6bc1fc2723033a58a96c2172
 size 14244

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:52e59564ead0405ff0eb4172f7953b666c269a959805a078abd715061080a7d1
 size 988

 version https://git-lfs.github.com/spec/v1
+oid sha256:1b5d546b2fffc3da93a4aa8da01e4de08986619d071e84b750436edd9eb12f37
 size 988

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1224653c609522db6a1a58ae89980b913b89e2d2dbcd6d2b06012cb14e5e2e51
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:3757dbe7156f5bc61a69d443c6dc83b53c9ebd7e6ededa1da92af126d09a6c57
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -2,9 +2,9 @@
   "best_global_step": 28000,
   "best_metric": 0.18110816386678455,
   "best_model_checkpoint": "./distil-whisper/checkpoint-28000",
-  "epoch": 26.0,
   "eval_steps": 1000,
-  "global_step": 44382,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -3505,12 +3505,70 @@
       "learning_rate": 2.3699922519484072e-07,
       "loss": 0.6662,
       "step": 44300
     }
   ],
   "logging_steps": 100,
-  "max_steps": 44382,
   "num_input_tokens_seen": 0,
-  "num_train_epochs": 26,
   "save_steps": 1000,
   "stateful_callbacks": {
     "TrainerControl": {
@@ -3519,12 +3577,12 @@
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
-        "should_training_stop": true
       },
       "attributes": {}
     }
   },
-  "total_flos": 5.77288295940096e+19,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null

   "best_global_step": 28000,
   "best_metric": 0.18110816386678455,
   "best_model_checkpoint": "./distil-whisper/checkpoint-28000",
+  "epoch": 26.362038664323375,
   "eval_steps": 1000,
+  "global_step": 45000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 2.3699922519484072e-07,
       "loss": 0.6662,
       "step": 44300
+    },
+    {
+      "epoch": 26.010544815465728,
+      "grad_norm": 5.860207557678223,
+      "learning_rate": 1.3472687832774603e-05,
+      "loss": 0.6097,
+      "step": 44400
+    },
+    {
+      "epoch": 26.06912712360867,
+      "grad_norm": 5.674122333526611,
+      "learning_rate": 1.3275488069414319e-05,
+      "loss": 0.6638,
+      "step": 44500
+    },
+    {
+      "epoch": 26.12770943175161,
+      "grad_norm": 7.24979829788208,
+      "learning_rate": 1.3078288306054034e-05,
+      "loss": 0.641,
+      "step": 44600
+    },
+    {
+      "epoch": 26.186291739894553,
+      "grad_norm": 7.524514198303223,
+      "learning_rate": 1.288108854269375e-05,
+      "loss": 0.6722,
+      "step": 44700
+    },
+    {
+      "epoch": 26.24487404803749,
+      "grad_norm": 5.542699337005615,
+      "learning_rate": 1.2683888779333466e-05,
+      "loss": 0.6386,
+      "step": 44800
+    },
+    {
+      "epoch": 26.303456356180433,
+      "grad_norm": 7.757282257080078,
+      "learning_rate": 1.2486689015973181e-05,
+      "loss": 0.6976,
+      "step": 44900
+    },
+    {
+      "epoch": 26.362038664323375,
+      "grad_norm": 5.828668117523193,
+      "learning_rate": 1.2289489252612897e-05,
+      "loss": 0.6921,
+      "step": 45000
+    },
+    {
+      "epoch": 26.362038664323375,
+      "eval_loss": 0.08329325169324875,
+      "eval_runtime": 154.0108,
+      "eval_samples_per_second": 3.247,
+      "eval_steps_per_second": 0.409,
+      "eval_wer": 0.18803418803418803,
+      "step": 45000
     }
   ],
   "logging_steps": 100,
+  "max_steps": 51210,
   "num_input_tokens_seen": 0,
+  "num_train_epochs": 30,
   "save_steps": 1000,
   "stateful_callbacks": {
     "TrainerControl": {
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
+        "should_training_stop": false
       },
       "attributes": {}
     }
   },
+  "total_flos": 5.853273724551168e+19,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null

last-checkpoint/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:53497c2a30fa39789de3f94cd648f2d8f2aac1e98751a369793ae553fcdcb336
 size 5496

 version https://git-lfs.github.com/spec/v1
+oid sha256:a4c57ccff6bf7086a307311fd25098672bae7b0308bc8beda9e8aefc9f99378d
 size 5496