| import transformers |
| from transformers import pipeline |
| import gradio as gr |
| import os |
| import sys |
| os.system("pip install evaluate") |
| os.system("pip install datasets") |
| os.system("pip install spicy") |
| os.system("pip install soundfile") |
| os.system("pip install datasets[audio]") |
| from evaluate import evaluator |
| from datasets import load_dataset, Audio |
|
|
|
|
| p = pipeline("automatic-speech-recognition") |
|
|
| task_evaluator = evaluator("automatic-speech-recognition") |
| |
| |
| data = load_dataset("audiofolder", data_files=["mskov/miso_test/test_set/and.wav","mskov/miso_test/test_set/chew1.wav","mskov/miso_test/test_set/chew3.wav", "mskov/miso_test/test_set/chew3.wav","mskov/miso_test/test_set/chew4.wav","mskov/miso_test/test_set/cough1.wav","mskov/miso_test/test_set/cough2.wav","mskov/miso_test/test_set/cough3.wav","mskov/miso_test/test_set/hi.wav","mskov/miso_test/test_set/knock_knock.wav","mskov/miso_test/test_set/mouth_sounds1.wav","mskov/miso_test/test_set/mouth_sounds2.wav","mskov/miso_test/test_set/no.wav","mskov/miso_test/test_set/not_bad.wav","mskov/miso_test/test_set/oh_i_wish.wav","mskov/miso_test/test_set/pop1.wav","mskov/miso_test/test_set/really.wav","mskov/miso_test/test_set/sigh1.wav","mskov/miso_test/test_set/sigh2.wav","mskov/miso_test/test_set/slurp1.wav","mskov/miso_test/test_set/slurp2.wav","mskov/miso_test/test_set/sneeze1.wav","mskov/miso_test/test_set/sneeze2.wav","mskov/miso_test/test_set/so_i_did_it_again.wav"] |
| results = task_evaluator.compute( |
| model_or_pipeline="https://huggingface.co/mskov/whisper_miso", |
| data=data, |
| input_column="file_name", |
| label_column="category", |
| metric="wer", |
| ) |
| print(results) |
|
|
|
|
| def transcribe(audio, state=""): |
| text = p(audio)["text"] |
| state += text + " " |
| return state, state |
|
|
| gr.Interface( |
| fn=transcribe, |
| inputs=[ |
| gr.Audio(source="microphone", type="filepath", streaming=True), |
| "state" |
| ], |
| outputs=[ |
| "textbox", |
| "state" |
| ], |
| live=True).launch() |
|
|