oluwagbotty commited on
Commit
9de7d44
·
verified ·
1 Parent(s): ec1fad2

Training in progress, step 4500, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0df53010fbda674d66d4e7bc9ec5ddc0a9d670bb01914b6ea6d1b3de14f8b08d
3
  size 151061672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe6340c896a7c2c061df0dd733b5cf530a152b2532fd7a214b42dfcd66d3dcca
3
  size 151061672
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:63c6a670910fe12d16745356d07433dfcc6ac6ea8edc3cb256b71fe86054182e
3
  size 302227787
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81902ac01d8aa613a26aa6114cce08cf29471cd8ff9696ad67e2ddcd60f2d64b
3
  size 302227787
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2a7dfa59f323bb7227795999d0c7cb18a2c95f21da91866b640cb672e937307b
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2fb9a2d94090c8b7124c6a39ee5f76482a7830faab97d12a16276fa23c8b2793
3
  size 14645
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9d0fc538266fee5c306edf72b32800812ba484b4157c432f9c91b1ab8fe68284
3
  size 1383
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06c5c8055f75339b21a661c9cb8f3a65736faa1a59a4e03ad8836f33d9e6ab5f
3
  size 1383
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4624c8f27770eb1a16767e932c8100ec43af2360d1e792bedb1826eaf2f685b3
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:426baa7f553935a148ab2ac05c277463a9fe7b24ac5c757cfb9a99895ed184c1
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": 3000,
3
  "best_metric": 0.703578531742096,
4
  "best_model_checkpoint": "./openai/whisper-tiny-sid-waxal/checkpoint-3000",
5
- "epoch": 3.341687552213868,
6
  "eval_steps": 500,
7
- "global_step": 4000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -1208,6 +1208,156 @@
1208
  "eval_steps_per_second": 0.506,
1209
  "eval_wer": 0.42202241587121264,
1210
  "step": 4000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1211
  }
1212
  ],
1213
  "logging_steps": 25,
@@ -1222,7 +1372,7 @@
1222
  "early_stopping_threshold": 0.0
1223
  },
1224
  "attributes": {
1225
- "early_stopping_patience_counter": 2
1226
  }
1227
  },
1228
  "TrainerControl": {
@@ -1231,12 +1381,12 @@
1231
  "should_evaluate": false,
1232
  "should_log": false,
1233
  "should_save": true,
1234
- "should_training_stop": false
1235
  },
1236
  "attributes": {}
1237
  }
1238
  },
1239
- "total_flos": 3.15040487215104e+18,
1240
  "train_batch_size": 32,
1241
  "trial_name": null,
1242
  "trial_params": null
 
2
  "best_global_step": 3000,
3
  "best_metric": 0.703578531742096,
4
  "best_model_checkpoint": "./openai/whisper-tiny-sid-waxal/checkpoint-3000",
5
+ "epoch": 3.7593984962406015,
6
  "eval_steps": 500,
7
+ "global_step": 4500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
1208
  "eval_steps_per_second": 0.506,
1209
  "eval_wer": 0.42202241587121264,
1210
  "step": 4000
1211
+ },
1212
+ {
1213
+ "epoch": 3.3625730994152048,
1214
+ "grad_norm": 3.37201189994812,
1215
+ "learning_rate": 9.004800903699521e-05,
1216
+ "loss": 0.40936187744140623,
1217
+ "step": 4025
1218
+ },
1219
+ {
1220
+ "epoch": 3.3834586466165413,
1221
+ "grad_norm": 2.939957618713379,
1222
+ "learning_rate": 8.997740751200226e-05,
1223
+ "loss": 0.4089693832397461,
1224
+ "step": 4050
1225
+ },
1226
+ {
1227
+ "epoch": 3.4043441938178782,
1228
+ "grad_norm": 3.129723072052002,
1229
+ "learning_rate": 8.990680598700933e-05,
1230
+ "loss": 0.4094087219238281,
1231
+ "step": 4075
1232
+ },
1233
+ {
1234
+ "epoch": 3.4252297410192147,
1235
+ "grad_norm": 3.143145799636841,
1236
+ "learning_rate": 8.983620446201638e-05,
1237
+ "loss": 0.41129344940185547,
1238
+ "step": 4100
1239
+ },
1240
+ {
1241
+ "epoch": 3.4461152882205512,
1242
+ "grad_norm": 2.852447032928467,
1243
+ "learning_rate": 8.976560293702345e-05,
1244
+ "loss": 0.4309309768676758,
1245
+ "step": 4125
1246
+ },
1247
+ {
1248
+ "epoch": 3.467000835421888,
1249
+ "grad_norm": 3.04453182220459,
1250
+ "learning_rate": 8.96950014120305e-05,
1251
+ "loss": 0.4245978546142578,
1252
+ "step": 4150
1253
+ },
1254
+ {
1255
+ "epoch": 3.4878863826232247,
1256
+ "grad_norm": 3.4194531440734863,
1257
+ "learning_rate": 8.962439988703757e-05,
1258
+ "loss": 0.41548053741455077,
1259
+ "step": 4175
1260
+ },
1261
+ {
1262
+ "epoch": 3.5087719298245617,
1263
+ "grad_norm": 2.7085516452789307,
1264
+ "learning_rate": 8.955379836204463e-05,
1265
+ "loss": 0.42301589965820313,
1266
+ "step": 4200
1267
+ },
1268
+ {
1269
+ "epoch": 3.529657477025898,
1270
+ "grad_norm": 2.965217113494873,
1271
+ "learning_rate": 8.948319683705169e-05,
1272
+ "loss": 0.4241177749633789,
1273
+ "step": 4225
1274
+ },
1275
+ {
1276
+ "epoch": 3.5505430242272347,
1277
+ "grad_norm": 3.2024154663085938,
1278
+ "learning_rate": 8.941259531205874e-05,
1279
+ "loss": 0.4297440338134766,
1280
+ "step": 4250
1281
+ },
1282
+ {
1283
+ "epoch": 3.571428571428571,
1284
+ "grad_norm": 2.9695773124694824,
1285
+ "learning_rate": 8.93419937870658e-05,
1286
+ "loss": 0.3943584442138672,
1287
+ "step": 4275
1288
+ },
1289
+ {
1290
+ "epoch": 3.592314118629908,
1291
+ "grad_norm": 3.200519561767578,
1292
+ "learning_rate": 8.927139226207286e-05,
1293
+ "loss": 0.4294881820678711,
1294
+ "step": 4300
1295
+ },
1296
+ {
1297
+ "epoch": 3.6131996658312446,
1298
+ "grad_norm": 2.9448063373565674,
1299
+ "learning_rate": 8.920079073707993e-05,
1300
+ "loss": 0.4301759338378906,
1301
+ "step": 4325
1302
+ },
1303
+ {
1304
+ "epoch": 3.6340852130325816,
1305
+ "grad_norm": 3.1099841594696045,
1306
+ "learning_rate": 8.913018921208699e-05,
1307
+ "loss": 0.42306079864501955,
1308
+ "step": 4350
1309
+ },
1310
+ {
1311
+ "epoch": 3.654970760233918,
1312
+ "grad_norm": 3.556462049484253,
1313
+ "learning_rate": 8.905958768709405e-05,
1314
+ "loss": 0.42727806091308596,
1315
+ "step": 4375
1316
+ },
1317
+ {
1318
+ "epoch": 3.6758563074352546,
1319
+ "grad_norm": 3.5050208568573,
1320
+ "learning_rate": 8.898898616210111e-05,
1321
+ "loss": 0.42058845520019533,
1322
+ "step": 4400
1323
+ },
1324
+ {
1325
+ "epoch": 3.6967418546365916,
1326
+ "grad_norm": 3.299497365951538,
1327
+ "learning_rate": 8.891838463710817e-05,
1328
+ "loss": 0.4445077514648437,
1329
+ "step": 4425
1330
+ },
1331
+ {
1332
+ "epoch": 3.717627401837928,
1333
+ "grad_norm": 3.4903392791748047,
1334
+ "learning_rate": 8.884778311211522e-05,
1335
+ "loss": 0.43223350524902343,
1336
+ "step": 4450
1337
+ },
1338
+ {
1339
+ "epoch": 3.738512949039265,
1340
+ "grad_norm": 3.2760531902313232,
1341
+ "learning_rate": 8.877718158712229e-05,
1342
+ "loss": 0.41040069580078126,
1343
+ "step": 4475
1344
+ },
1345
+ {
1346
+ "epoch": 3.7593984962406015,
1347
+ "grad_norm": 2.6590590476989746,
1348
+ "learning_rate": 8.870658006212934e-05,
1349
+ "loss": 0.4209041976928711,
1350
+ "step": 4500
1351
+ },
1352
+ {
1353
+ "epoch": 3.7593984962406015,
1354
+ "eval_cer": 0.10421973321402364,
1355
+ "eval_loss": 0.7152175903320312,
1356
+ "eval_runtime": 95.3684,
1357
+ "eval_samples_per_second": 32.348,
1358
+ "eval_steps_per_second": 0.514,
1359
+ "eval_wer": 0.41531705019326415,
1360
+ "step": 4500
1361
  }
1362
  ],
1363
  "logging_steps": 25,
 
1372
  "early_stopping_threshold": 0.0
1373
  },
1374
  "attributes": {
1375
+ "early_stopping_patience_counter": 3
1376
  }
1377
  },
1378
  "TrainerControl": {
 
1381
  "should_evaluate": false,
1382
  "should_log": false,
1383
  "should_save": true,
1384
+ "should_training_stop": true
1385
  },
1386
  "attributes": {}
1387
  }
1388
  },
1389
+ "total_flos": 3.54430703407104e+18,
1390
  "train_batch_size": 32,
1391
  "trial_name": null,
1392
  "trial_params": null