Instructions to use waxal-benchmarking/whisper-tiny-sid-Oreoluwa with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- Transformers
How to use waxal-benchmarking/whisper-tiny-sid-Oreoluwa with Transformers:
```python
# Use a pipeline as a high-level helper
from transformers import pipeline

pipe = pipeline("automatic-speech-recognition", model="waxal-benchmarking/whisper-tiny-sid-Oreoluwa")

# Load model directly
from transformers import AutoProcessor, AutoModelForSpeechSeq2Seq

processor = AutoProcessor.from_pretrained("waxal-benchmarking/whisper-tiny-sid-Oreoluwa")
model = AutoModelForSpeechSeq2Seq.from_pretrained("waxal-benchmarking/whisper-tiny-sid-Oreoluwa")
```
- Notebooks
- Google Colab
- Kaggle
Training in progress, step 4500, checkpoint
Browse files
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 151061672
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fe6340c896a7c2c061df0dd733b5cf530a152b2532fd7a214b42dfcd66d3dcca
|
| 3 |
size 151061672
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 302227787
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:81902ac01d8aa613a26aa6114cce08cf29471cd8ff9696ad67e2ddcd60f2d64b
|
| 3 |
size 302227787
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14645
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2fb9a2d94090c8b7124c6a39ee5f76482a7830faab97d12a16276fa23c8b2793
|
| 3 |
size 14645
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1383
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:06c5c8055f75339b21a661c9cb8f3a65736faa1a59a4e03ad8836f33d9e6ab5f
|
| 3 |
size 1383
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1465
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:426baa7f553935a148ab2ac05c277463a9fe7b24ac5c757cfb9a99895ed184c1
|
| 3 |
size 1465
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": 3000,
|
| 3 |
"best_metric": 0.703578531742096,
|
| 4 |
"best_model_checkpoint": "./openai/whisper-tiny-sid-waxal/checkpoint-3000",
|
| 5 |
-
"epoch": 3.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -1208,6 +1208,156 @@
|
|
| 1208 |
"eval_steps_per_second": 0.506,
|
| 1209 |
"eval_wer": 0.42202241587121264,
|
| 1210 |
"step": 4000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1211 |
}
|
| 1212 |
],
|
| 1213 |
"logging_steps": 25,
|
|
@@ -1222,7 +1372,7 @@
|
|
| 1222 |
"early_stopping_threshold": 0.0
|
| 1223 |
},
|
| 1224 |
"attributes": {
|
| 1225 |
-
"early_stopping_patience_counter":
|
| 1226 |
}
|
| 1227 |
},
|
| 1228 |
"TrainerControl": {
|
|
@@ -1231,12 +1381,12 @@
|
|
| 1231 |
"should_evaluate": false,
|
| 1232 |
"should_log": false,
|
| 1233 |
"should_save": true,
|
| 1234 |
-
"should_training_stop":
|
| 1235 |
},
|
| 1236 |
"attributes": {}
|
| 1237 |
}
|
| 1238 |
},
|
| 1239 |
-
"total_flos": 3.
|
| 1240 |
"train_batch_size": 32,
|
| 1241 |
"trial_name": null,
|
| 1242 |
"trial_params": null
|
|
|
|
| 2 |
"best_global_step": 3000,
|
| 3 |
"best_metric": 0.703578531742096,
|
| 4 |
"best_model_checkpoint": "./openai/whisper-tiny-sid-waxal/checkpoint-3000",
|
| 5 |
+
"epoch": 3.7593984962406015,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 4500,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 1208 |
"eval_steps_per_second": 0.506,
|
| 1209 |
"eval_wer": 0.42202241587121264,
|
| 1210 |
"step": 4000
|
| 1211 |
+
},
|
| 1212 |
+
{
|
| 1213 |
+
"epoch": 3.3625730994152048,
|
| 1214 |
+
"grad_norm": 3.37201189994812,
|
| 1215 |
+
"learning_rate": 9.004800903699521e-05,
|
| 1216 |
+
"loss": 0.40936187744140623,
|
| 1217 |
+
"step": 4025
|
| 1218 |
+
},
|
| 1219 |
+
{
|
| 1220 |
+
"epoch": 3.3834586466165413,
|
| 1221 |
+
"grad_norm": 2.939957618713379,
|
| 1222 |
+
"learning_rate": 8.997740751200226e-05,
|
| 1223 |
+
"loss": 0.4089693832397461,
|
| 1224 |
+
"step": 4050
|
| 1225 |
+
},
|
| 1226 |
+
{
|
| 1227 |
+
"epoch": 3.4043441938178782,
|
| 1228 |
+
"grad_norm": 3.129723072052002,
|
| 1229 |
+
"learning_rate": 8.990680598700933e-05,
|
| 1230 |
+
"loss": 0.4094087219238281,
|
| 1231 |
+
"step": 4075
|
| 1232 |
+
},
|
| 1233 |
+
{
|
| 1234 |
+
"epoch": 3.4252297410192147,
|
| 1235 |
+
"grad_norm": 3.143145799636841,
|
| 1236 |
+
"learning_rate": 8.983620446201638e-05,
|
| 1237 |
+
"loss": 0.41129344940185547,
|
| 1238 |
+
"step": 4100
|
| 1239 |
+
},
|
| 1240 |
+
{
|
| 1241 |
+
"epoch": 3.4461152882205512,
|
| 1242 |
+
"grad_norm": 2.852447032928467,
|
| 1243 |
+
"learning_rate": 8.976560293702345e-05,
|
| 1244 |
+
"loss": 0.4309309768676758,
|
| 1245 |
+
"step": 4125
|
| 1246 |
+
},
|
| 1247 |
+
{
|
| 1248 |
+
"epoch": 3.467000835421888,
|
| 1249 |
+
"grad_norm": 3.04453182220459,
|
| 1250 |
+
"learning_rate": 8.96950014120305e-05,
|
| 1251 |
+
"loss": 0.4245978546142578,
|
| 1252 |
+
"step": 4150
|
| 1253 |
+
},
|
| 1254 |
+
{
|
| 1255 |
+
"epoch": 3.4878863826232247,
|
| 1256 |
+
"grad_norm": 3.4194531440734863,
|
| 1257 |
+
"learning_rate": 8.962439988703757e-05,
|
| 1258 |
+
"loss": 0.41548053741455077,
|
| 1259 |
+
"step": 4175
|
| 1260 |
+
},
|
| 1261 |
+
{
|
| 1262 |
+
"epoch": 3.5087719298245617,
|
| 1263 |
+
"grad_norm": 2.7085516452789307,
|
| 1264 |
+
"learning_rate": 8.955379836204463e-05,
|
| 1265 |
+
"loss": 0.42301589965820313,
|
| 1266 |
+
"step": 4200
|
| 1267 |
+
},
|
| 1268 |
+
{
|
| 1269 |
+
"epoch": 3.529657477025898,
|
| 1270 |
+
"grad_norm": 2.965217113494873,
|
| 1271 |
+
"learning_rate": 8.948319683705169e-05,
|
| 1272 |
+
"loss": 0.4241177749633789,
|
| 1273 |
+
"step": 4225
|
| 1274 |
+
},
|
| 1275 |
+
{
|
| 1276 |
+
"epoch": 3.5505430242272347,
|
| 1277 |
+
"grad_norm": 3.2024154663085938,
|
| 1278 |
+
"learning_rate": 8.941259531205874e-05,
|
| 1279 |
+
"loss": 0.4297440338134766,
|
| 1280 |
+
"step": 4250
|
| 1281 |
+
},
|
| 1282 |
+
{
|
| 1283 |
+
"epoch": 3.571428571428571,
|
| 1284 |
+
"grad_norm": 2.9695773124694824,
|
| 1285 |
+
"learning_rate": 8.93419937870658e-05,
|
| 1286 |
+
"loss": 0.3943584442138672,
|
| 1287 |
+
"step": 4275
|
| 1288 |
+
},
|
| 1289 |
+
{
|
| 1290 |
+
"epoch": 3.592314118629908,
|
| 1291 |
+
"grad_norm": 3.200519561767578,
|
| 1292 |
+
"learning_rate": 8.927139226207286e-05,
|
| 1293 |
+
"loss": 0.4294881820678711,
|
| 1294 |
+
"step": 4300
|
| 1295 |
+
},
|
| 1296 |
+
{
|
| 1297 |
+
"epoch": 3.6131996658312446,
|
| 1298 |
+
"grad_norm": 2.9448063373565674,
|
| 1299 |
+
"learning_rate": 8.920079073707993e-05,
|
| 1300 |
+
"loss": 0.4301759338378906,
|
| 1301 |
+
"step": 4325
|
| 1302 |
+
},
|
| 1303 |
+
{
|
| 1304 |
+
"epoch": 3.6340852130325816,
|
| 1305 |
+
"grad_norm": 3.1099841594696045,
|
| 1306 |
+
"learning_rate": 8.913018921208699e-05,
|
| 1307 |
+
"loss": 0.42306079864501955,
|
| 1308 |
+
"step": 4350
|
| 1309 |
+
},
|
| 1310 |
+
{
|
| 1311 |
+
"epoch": 3.654970760233918,
|
| 1312 |
+
"grad_norm": 3.556462049484253,
|
| 1313 |
+
"learning_rate": 8.905958768709405e-05,
|
| 1314 |
+
"loss": 0.42727806091308596,
|
| 1315 |
+
"step": 4375
|
| 1316 |
+
},
|
| 1317 |
+
{
|
| 1318 |
+
"epoch": 3.6758563074352546,
|
| 1319 |
+
"grad_norm": 3.5050208568573,
|
| 1320 |
+
"learning_rate": 8.898898616210111e-05,
|
| 1321 |
+
"loss": 0.42058845520019533,
|
| 1322 |
+
"step": 4400
|
| 1323 |
+
},
|
| 1324 |
+
{
|
| 1325 |
+
"epoch": 3.6967418546365916,
|
| 1326 |
+
"grad_norm": 3.299497365951538,
|
| 1327 |
+
"learning_rate": 8.891838463710817e-05,
|
| 1328 |
+
"loss": 0.4445077514648437,
|
| 1329 |
+
"step": 4425
|
| 1330 |
+
},
|
| 1331 |
+
{
|
| 1332 |
+
"epoch": 3.717627401837928,
|
| 1333 |
+
"grad_norm": 3.4903392791748047,
|
| 1334 |
+
"learning_rate": 8.884778311211522e-05,
|
| 1335 |
+
"loss": 0.43223350524902343,
|
| 1336 |
+
"step": 4450
|
| 1337 |
+
},
|
| 1338 |
+
{
|
| 1339 |
+
"epoch": 3.738512949039265,
|
| 1340 |
+
"grad_norm": 3.2760531902313232,
|
| 1341 |
+
"learning_rate": 8.877718158712229e-05,
|
| 1342 |
+
"loss": 0.41040069580078126,
|
| 1343 |
+
"step": 4475
|
| 1344 |
+
},
|
| 1345 |
+
{
|
| 1346 |
+
"epoch": 3.7593984962406015,
|
| 1347 |
+
"grad_norm": 2.6590590476989746,
|
| 1348 |
+
"learning_rate": 8.870658006212934e-05,
|
| 1349 |
+
"loss": 0.4209041976928711,
|
| 1350 |
+
"step": 4500
|
| 1351 |
+
},
|
| 1352 |
+
{
|
| 1353 |
+
"epoch": 3.7593984962406015,
|
| 1354 |
+
"eval_cer": 0.10421973321402364,
|
| 1355 |
+
"eval_loss": 0.7152175903320312,
|
| 1356 |
+
"eval_runtime": 95.3684,
|
| 1357 |
+
"eval_samples_per_second": 32.348,
|
| 1358 |
+
"eval_steps_per_second": 0.514,
|
| 1359 |
+
"eval_wer": 0.41531705019326415,
|
| 1360 |
+
"step": 4500
|
| 1361 |
}
|
| 1362 |
],
|
| 1363 |
"logging_steps": 25,
|
|
|
|
| 1372 |
"early_stopping_threshold": 0.0
|
| 1373 |
},
|
| 1374 |
"attributes": {
|
| 1375 |
+
"early_stopping_patience_counter": 3
|
| 1376 |
}
|
| 1377 |
},
|
| 1378 |
"TrainerControl": {
|
|
|
|
| 1381 |
"should_evaluate": false,
|
| 1382 |
"should_log": false,
|
| 1383 |
"should_save": true,
|
| 1384 |
+
"should_training_stop": true
|
| 1385 |
},
|
| 1386 |
"attributes": {}
|
| 1387 |
}
|
| 1388 |
},
|
| 1389 |
+
"total_flos": 3.54430703407104e+18,
|
| 1390 |
"train_batch_size": 32,
|
| 1391 |
"trial_name": null,
|
| 1392 |
"trial_params": null
|