Training in progress, step 33740, checkpoint

Files changed (6) hide show

last-checkpoint/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:23ef42a9fc9233dcc343084f9ce7d93482fb05b80136c44f06eb62dce740e1e1
 size 223144592

 version https://git-lfs.github.com/spec/v1
+oid sha256:cfbf3330733366f480058f4acc43f4b33bcf90be58f6148c9e7ba9e9cc16556b
 size 223144592

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:32c869cc0994601b8230c0fb7be3b823eef4092219ab8cbfc386196f812e2946
 size 281574266

 version https://git-lfs.github.com/spec/v1
+oid sha256:b0baa87b6a20f5da63804deb476e869325bdd38434d4801e9ff754af510fe1f2
 size 281574266

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d3c799733816fb8c27de7a857b6166730dd1c37c89ae2ebf9b77cbef47bdf09b
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:c8057494ce92a550bfad621d8189c19e910a6d4abd86bbe1cf6f59d4e3d4ca54
 size 14244

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f0ca45c6ca9d8e60f0da01fa0c96188461c4c1df90a4d99312ba8b2c40b8e0f3
 size 988

 version https://git-lfs.github.com/spec/v1
+oid sha256:fb779461c157e920976902f7e10da553ef08690b8cb1e678f1ad0ceb27b3b0a1
 size 988

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3625cf5c5369228475174d4f84a602898f6a11c9e59317a786848cd0367b3ce2
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:ce728e16d5ac03050b00527a8e1a90dc74db0b69a4e3e2d0415dc2af3e021509
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -2,9 +2,9 @@
   "best_global_step": 4000,
   "best_metric": 0.18950781019746538,
   "best_model_checkpoint": "./distil-whisper/checkpoint-4000",
-  "epoch": 19.91701244813278,
   "eval_steps": 400,
-  "global_step": 33600,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -3116,6 +3116,13 @@
       "eval_steps_per_second": 0.423,
       "eval_wer": 0.2002652519893899,
       "step": 33600
     }
   ],
   "logging_steps": 100,
@@ -3130,12 +3137,12 @@
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
-        "should_training_stop": false
       },
       "attributes": {}
     }
   },
-  "total_flos": 4.370219393089536e+19,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null

   "best_global_step": 4000,
   "best_metric": 0.18950781019746538,
   "best_model_checkpoint": "./distil-whisper/checkpoint-4000",
+  "epoch": 20.0,
   "eval_steps": 400,
+  "global_step": 33740,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_steps_per_second": 0.423,
       "eval_wer": 0.2002652519893899,
       "step": 33600
+    },
+    {
+      "epoch": 19.97628927089508,
+      "grad_norm": 6.524932861328125,
+      "learning_rate": 1.7448856799037304e-07,
+      "loss": 0.8792,
+      "step": 33700
     }
   ],
   "logging_steps": 100,
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
+        "should_training_stop": true
       },
       "attributes": {}
     }
   },
+  "total_flos": 4.38840243781632e+19,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null