Spaces:
Sleeping
Sleeping
| import whisper | |
| import yt_dlp | |
| import gradio as gr | |
| import os | |
| import re | |
| import logging | |
# Configure the root logger to emit records at INFO level and above.
logging.basicConfig(
    level=logging.INFO,
)

# Load the Whisper "medium" model once, at import time, and keep it in a
# module-level name so it is not reloaded for every transcription request.
model = whisper.load_model("medium")
def get_text(url):
    """Download the audio of a YouTube video and return its Whisper transcript.

    Args:
        url: Address of the video to transcribe. ``None``, an empty string,
            or a whitespace-only string means there is nothing to transcribe.

    Returns:
        The transcript text with leading/trailing whitespace removed, or an
        empty string when no URL was supplied.

    Raises:
        Exceptions raised by ``yt_dlp`` while downloading, or by
        ``model.transcribe``, are not caught here and propagate to the caller.
    """
    # Guard clause: a blank URL cannot be downloaded, so return an empty
    # transcript instead of handing it to yt_dlp.
    if not url or not url.strip():
        return ''
    url = url.strip()

    # NOTE(review): 'audio-format' looks like the command-line flag spelling;
    # confirm that yt_dlp honours this key when passed in the options dict.
    ydl_opts = {'format': 'bestaudio', 'audio-format': 'wav', 'outtmpl': '%(id)s.%(ext)s'}

    audio_file = None
    try:
        with yt_dlp.YoutubeDL(ydl_opts) as ydl:
            # Extract information from the given URL and download the audio.
            info_dict = ydl.extract_info(url, download=True)
            # Resolve the on-disk name of the file that was just downloaded.
            audio_file = ydl.prepare_filename(info_dict)

        result = model.transcribe(audio_file, task="transcribe")
        return result['text'].strip()
    finally:
        # The download is only needed for this one transcription; delete it so
        # repeated requests do not accumulate audio files on disk.
        if audio_file is not None and os.path.exists(audio_file):
            os.remove(audio_file)
# Build the page: a heading, a usage hint, a URL input, a button and an
# output box. Clicking the button calls get_text with the URL and writes the
# returned string into the transcript box.
with gr.Blocks() as demo:
    # Heading and one-line instructions, both passed as centered HTML.
    gr.Markdown("<h1><center>YouTube Video-to-Text using Whisper</center></h1>")
    gr.Markdown("<center>Enter the link of any YouTube video to generate a text transcript of the video.</center>")

    input_text_url = gr.Textbox(
        label='YouTube URL',
        placeholder='Youtube video URL',
    )
    result_button_transcribe = gr.Button('Transcribe')
    output_text_transcribe = gr.Textbox(
        label='Transcript',
        placeholder='Transcript of the YouTube video.',
    )

    # Wire the button to the transcription function.
    result_button_transcribe.click(
        fn=get_text,
        inputs=input_text_url,
        outputs=output_text_transcribe,
    )

# Start the Gradio server for the interface defined above.
demo.launch()