Baselhany commited on
Commit
778946d
·
verified ·
1 Parent(s): 820cadb

Training in progress, step 14000, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2acb4494239e0f2939b3554b19b44da1666640d4f17fee2602fc2f73e90c86a2
3
  size 223144592
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aac2c722661dfc970b5b362fbdfe7348728114256cbf16c80817c6883bccfc3c
3
  size 223144592
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e09793699a5f80b3df4ba07dbf1ff576b3a0280feb3ad0da5b0b59817e93f5ca
3
  size 281574266
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6ebd804fbe71863b75c6e04deb067d66c945809a3503b78c812931908581ff7
3
  size 281574266
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8dc4c3096e3335993cba70f84f7c74e0bdefbe1836fe1f21fd4c7db981a15d18
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fef3f536e40043cb197cbf070d1d05bc7d1e4addbc3323ceb593a92b77a5ed05
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d13fec0d58a698a1588dfadf5d00d4fb69b490cb8fc2864fda3b2a2af6f17146
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe901f3488345253ab27036dffafec4bebac63e87632ab024a1c268eea13b76c
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:45c8cf259ef238a9913feac351553475b48cc5d3f6153c06161cc934160ae3d6
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7dd03a3ec49e4f6d8256968a34ec8adb177fe3d2cfce1011557149c70298286
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": 7200,
3
  "best_metric": 0.2094017094017094,
4
  "best_model_checkpoint": "./distil-whisper/checkpoint-7200",
5
- "epoch": 9.68911455549617,
6
  "eval_steps": 400,
7
- "global_step": 13600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -1266,6 +1266,43 @@
1266
  "eval_steps_per_second": 0.435,
1267
  "eval_wer": 0.2163277335691129,
1268
  "step": 13600
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1269
  }
1270
  ],
1271
  "logging_steps": 100,
@@ -1285,7 +1322,7 @@
1285
  "attributes": {}
1286
  }
1287
  },
1288
- "total_flos": 1.768174066335744e+19,
1289
  "train_batch_size": 8,
1290
  "trial_name": null,
1291
  "trial_params": null
 
2
  "best_global_step": 7200,
3
  "best_metric": 0.2094017094017094,
4
  "best_model_checkpoint": "./distil-whisper/checkpoint-7200",
5
+ "epoch": 9.974167112061286,
6
  "eval_steps": 400,
7
+ "global_step": 14000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
1266
  "eval_steps_per_second": 0.435,
1267
  "eval_wer": 0.2163277335691129,
1268
  "step": 13600
1269
+ },
1270
+ {
1271
+ "epoch": 9.760377694637448,
1272
+ "grad_norm": 26.84296417236328,
1273
+ "learning_rate": 2.549889135254989e-06,
1274
+ "loss": 1.7145,
1275
+ "step": 13700
1276
+ },
1277
+ {
1278
+ "epoch": 9.831640833778728,
1279
+ "grad_norm": 22.363689422607422,
1280
+ "learning_rate": 1.8107908351810791e-06,
1281
+ "loss": 1.691,
1282
+ "step": 13800
1283
+ },
1284
+ {
1285
+ "epoch": 9.902903972920008,
1286
+ "grad_norm": 13.84276008605957,
1287
+ "learning_rate": 1.0716925351071693e-06,
1288
+ "loss": 1.5786,
1289
+ "step": 13900
1290
+ },
1291
+ {
1292
+ "epoch": 9.974167112061286,
1293
+ "grad_norm": 14.124626159667969,
1294
+ "learning_rate": 3.3259423503325944e-07,
1295
+ "loss": 1.6427,
1296
+ "step": 14000
1297
+ },
1298
+ {
1299
+ "epoch": 9.974167112061286,
1300
+ "eval_loss": 0.10011343657970428,
1301
+ "eval_runtime": 145.0395,
1302
+ "eval_samples_per_second": 3.447,
1303
+ "eval_steps_per_second": 0.434,
1304
+ "eval_wer": 0.21573828470380194,
1305
+ "step": 14000
1306
  }
1307
  ],
1308
  "logging_steps": 100,
 
1322
  "attributes": {}
1323
  }
1324
  },
1325
+ "total_flos": 1.820206924038144e+19,
1326
  "train_batch_size": 8,
1327
  "trial_name": null,
1328
  "trial_params": null