Spaces:
Sleeping
Sleeping
| import gradio as gr | |
| import whisper | |
| from wordcloud import WordCloud | |
| import tempfile | |
| import os | |
# Load the Whisper "base" checkpoint once at import time; transcribe() reuses
# this single module-level instance for every call.
model = whisper.load_model(name="base")
def transcribe(audio):
    """Transcribe an audio file and render a word cloud of the transcript.

    Args:
        audio: Path of the audio file to transcribe (the interface passes a
            file path). A falsy value such as ``None`` or ``""`` means no
            file was supplied.

    Returns:
        A ``(text, image_path)`` tuple. ``text`` is the transcript;
        ``image_path`` is the path of a PNG word cloud, or ``None`` when no
        word cloud could be drawn (no audio, or no usable words in the text).
    """
    # Nothing to transcribe: return empty outputs instead of failing inside
    # the model call.
    if not audio:
        return "", None

    # Transcribe the audio file
    result = model.transcribe(audio)
    text = result['text']

    # WordCloud raises ValueError when the text yields no words to plot
    # (e.g. silence, or only stop words); the transcript is still returned.
    try:
        wordcloud = WordCloud(width=800, height=400, background_color='white').generate(text)
    except ValueError:
        return text, None

    # Only the unique file name is needed; delete=False keeps the file on
    # disk, and the handle is closed before the image is written to the path.
    with tempfile.NamedTemporaryFile(delete=False, suffix='.png') as tmpfile:
        image_path = tmpfile.name
    wordcloud.to_file(image_path)

    # NOTE(review): the PNG is intentionally left on disk because the caller
    # reads it after this function returns — confirm who cleans it up.
    return text, image_path
# Build the Gradio UI: one audio input, two outputs (transcript text and the
# word-cloud image). Both components exchange file paths with transcribe().
_audio_input = gr.Audio(type="filepath")
_cloud_output = gr.Image(type="filepath")

demo = gr.Interface(
    fn=transcribe,
    inputs=_audio_input,
    outputs=["text", _cloud_output],
    title="SAUTI_V1",
    description="Upload an audio file to transcribe it to text and view a word cloud of the text. Disclaimer: This might run slow due to it been hosted on free tier",
)

# Start the web app only when this file is executed as a script.
if __name__ == "__main__":
    demo.launch()