Training in progress, step 51210, checkpoint

Files changed (6) hide show

last-checkpoint/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3319e82e3a312fa6faba8a237003ca93f3ecdd36457f19215227deb690e99af7
 size 223144592

 version https://git-lfs.github.com/spec/v1
+oid sha256:37c60fec1d61a715abc34621b50732bb6b292b703f3afc3223e3e83424c74ab7
 size 223144592

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:aa51d384b7f561bf1e67da73024206fffa4e8dda22efaad2fab35ebc2b490555
 size 281574266

 version https://git-lfs.github.com/spec/v1
+oid sha256:4b66491803298bd494de49c07185852ace2b4947178790cf4fa9c4e8672a271e
 size 281574266

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:77f7aee25049de87d8cdf4f74b8e35dd47f80345ce100bfb1c453db7271d2eae
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:81b07648b78bb7a2992c7dd8ed36fd94978c5a54d9b9e494eed5b57a0c11e7e7
 size 14244

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:aa84d3b0b595baf750d6ab584421db48e3a346e0b07a20e76b7ce6ee4aa3ec8b
 size 988

 version https://git-lfs.github.com/spec/v1
+oid sha256:8ece15461d3df986ea66e8c68a5924ba82a155ca2f8c576aeb5dbb460a0585e0
 size 988

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:242d37357dc73797e49eb5568ec9ca45b32042b44f1e8681ac659f27ecd237fb
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:3798d28e55ce039da2d5ff96e3dde65a999d6fa0cc557856baaa4f2f9f004976
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -2,9 +2,9 @@
   "best_global_step": 28000,
   "best_metric": 0.18110816386678455,
   "best_model_checkpoint": "./distil-whisper/checkpoint-28000",
-  "epoch": 29.876977152899823,
   "eval_steps": 1000,
-  "global_step": 51000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -4037,6 +4037,20 @@
       "eval_steps_per_second": 0.434,
       "eval_wer": 0.18980253463012084,
       "step": 51000
     }
   ],
   "logging_steps": 100,
@@ -4051,12 +4065,12 @@
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
-        "should_training_stop": false
       },
       "attributes": {}
     }
   },
-  "total_flos": 6.633717809283072e+19,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null

   "best_global_step": 28000,
   "best_metric": 0.18110816386678455,
   "best_model_checkpoint": "./distil-whisper/checkpoint-28000",
+  "epoch": 30.0,
   "eval_steps": 1000,
+  "global_step": 51210,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_steps_per_second": 0.434,
       "eval_wer": 0.18980253463012084,
       "step": 51000
+    },
+    {
+      "epoch": 29.935559461042764,
+      "grad_norm": 4.774900436401367,
+      "learning_rate": 2.6424768290278054e-07,
+      "loss": 0.6359,
+      "step": 51100
+    },
+    {
+      "epoch": 29.994141769185706,
+      "grad_norm": 4.431262493133545,
+      "learning_rate": 6.704791954249655e-08,
+      "loss": 0.6618,
+      "step": 51200
     }
   ],
   "logging_steps": 100,
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
+        "should_training_stop": true
       },
       "attributes": {}
     }
   },
+  "total_flos": 6.6610187993088e+19,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null