Commit ·
f1bbf33
1
Parent(s): 32440c9
add length for faster training
Browse files
main.py
CHANGED
|
@@ -61,6 +61,8 @@ def prepare_dataset(batch, processor):
|
|
| 61 |
|
| 62 |
batch["input_values"] = processor(batch["speech"], sampling_rate=batch["sampling_rate"][0]).input_values
|
| 63 |
|
|
|
|
|
|
|
| 64 |
with processor.as_target_processor():
|
| 65 |
batch["labels"] = processor(batch["target_text"]).input_ids
|
| 66 |
return batch
|
|
|
|
| 61 |
|
| 62 |
batch["input_values"] = processor(batch["speech"], sampling_rate=batch["sampling_rate"][0]).input_values
|
| 63 |
|
| 64 |
+
batch["length"] = [len(item) for item in batch["input_values"]]
|
| 65 |
+
|
| 66 |
with processor.as_target_processor():
|
| 67 |
batch["labels"] = processor(batch["target_text"]).input_ids
|
| 68 |
return batch
|