Baselhany committed on
Commit
3239eae
·
verified ·
1 Parent(s): 047878a

Training in progress, step 25200, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c736fd594c380dd002a6342fa0604bc644313aed80303796815ff4b03e46442e
3
  size 223144592
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:781ba7beccdb6f2de672bde036b555a9c2452f37617312f1ada22f7dd95b7516
3
  size 223144592
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a3e2b9eff304abf490d045d1420af73881798301b076f854de745fb8bb32c5f5
3
  size 281574266
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70b435d6180ac5725ee8b276e9d4bcd3f744ed2b2d69e97b908f1fc38b66b25f
3
  size 281574266
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e2eaa69a43fe9ca74e4bd1e79b0bbd6af7b0c407425e6e1e3b18bd47b766849b
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72a46adf461123b3c04c2270eadae64d4ce1b5a208dd5fc2b1d415269f53fe47
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e15e488492623c161675a7bb297a1a2ecfcf210cea79271160fd0a257b5fa31e
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b21eaeb6df3448a126aa3c865471f11d93d5da05e32d2b0b19d5120cef1d8306
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fd454cefdd5cc5bafc5dee97883508d8606ab9e8e2795ebeb6c8caeb65187032
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b54547c361b34cbfc85f7276b4e56c67fff255001445cd0390ae05eba8160d38
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": 4000,
3
  "best_metric": 0.18950781019746538,
4
  "best_model_checkpoint": "./distil-whisper/checkpoint-4000",
5
- "epoch": 14.700652045050385,
6
  "eval_steps": 400,
7
- "global_step": 24800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -2302,6 +2302,43 @@
2302
  "eval_steps_per_second": 0.429,
2303
  "eval_wer": 0.20085470085470086,
2304
  "step": 24800
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2305
  }
2306
  ],
2307
  "logging_steps": 100,
@@ -2321,7 +2358,7 @@
2321
  "attributes": {}
2322
  }
2323
  },
2324
- "total_flos": 3.225638800982016e+19,
2325
  "train_batch_size": 8,
2326
  "trial_name": null,
2327
  "trial_params": null
 
2
  "best_global_step": 4000,
3
  "best_metric": 0.18950781019746538,
4
  "best_model_checkpoint": "./distil-whisper/checkpoint-4000",
5
+ "epoch": 14.937759336099585,
6
  "eval_steps": 400,
7
+ "global_step": 25200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
2302
  "eval_steps_per_second": 0.429,
2303
  "eval_wer": 0.20085470085470086,
2304
  "step": 24800
2305
+ },
2306
+ {
2307
+ "epoch": 14.759928867812686,
2308
+ "grad_norm": 8.114453315734863,
2309
+ "learning_rate": 1.689175569441645e-06,
2310
+ "loss": 0.8946,
2311
+ "step": 24900
2312
+ },
2313
+ {
2314
+ "epoch": 14.819205690574986,
2315
+ "grad_norm": 8.182477951049805,
2316
+ "learning_rate": 1.2860310421286033e-06,
2317
+ "loss": 0.9534,
2318
+ "step": 25000
2319
+ },
2320
+ {
2321
+ "epoch": 14.878482513337286,
2322
+ "grad_norm": 6.653454303741455,
2323
+ "learning_rate": 8.828865148155615e-07,
2324
+ "loss": 0.9688,
2325
+ "step": 25100
2326
+ },
2327
+ {
2328
+ "epoch": 14.937759336099585,
2329
+ "grad_norm": 9.1705322265625,
2330
+ "learning_rate": 4.837734327756501e-07,
2331
+ "loss": 0.8976,
2332
+ "step": 25200
2333
+ },
2334
+ {
2335
+ "epoch": 14.937759336099585,
2336
+ "eval_loss": 0.08782143890857697,
2337
+ "eval_runtime": 149.7053,
2338
+ "eval_samples_per_second": 3.34,
2339
+ "eval_steps_per_second": 0.421,
2340
+ "eval_wer": 0.20159151193633953,
2341
+ "step": 25200
2342
  }
2343
  ],
2344
  "logging_steps": 100,
 
2358
  "attributes": {}
2359
  }
2360
  },
2361
+ "total_flos": 3.277671658684416e+19,
2362
  "train_batch_size": 8,
2363
  "trial_name": null,
2364
  "trial_params": null