Spaces:

MicroHealth
/

AV-to-transcripts

Paused

App Files Files Community

bluenevus committed on Apr 26, 2025

Commit

ce4312e

verified ·

1 Parent(s): 25726df

Update app.py

Browse files

Files changed (1) hide show

app.py +86 -46

app.py CHANGED Viewed

@@ -3,6 +3,7 @@ import os
 import tempfile
 import threading
 import base64
 from urllib.parse import urlparse
 import dash
@@ -16,11 +17,19 @@ from pydub import AudioSegment
 import google.generativeai as genai
 from moviepy.editor import VideoFileClip
 # Initialize the Dash app
 app = dash.Dash(__name__, external_stylesheets=[dbc.themes.BOOTSTRAP])
 # Retrieve the Google API key from Hugging Face Spaces
 GOOGLE_API_KEY = os.environ.get("GOOGLE_API_KEY")
 genai.configure(api_key=GOOGLE_API_KEY)
 # Initialize Gemini model
@@ -31,68 +40,95 @@ def is_valid_url(url):
         result = urlparse(url)
         return all([result.scheme, result.netloc])
     except ValueError:
         return False
 def download_media(url):
-    if "youtube.com" in url or "youtu.be" in url:
-        yt = YouTube(url)
-        stream = yt.streams.filter(progressive=True, file_extension='mp4').first()
-        with tempfile.NamedTemporaryFile(delete=False, suffix=".mp4") as temp_file:
-            stream.download(output_path=os.path.dirname(temp_file.name), filename=temp_file.name)
-            return temp_file.name
-    else:
-        response = requests.get(url)
-        content_type = response.headers.get('content-type', '')
-        if 'video' in content_type:
-            suffix = '.mp4'
-        elif 'audio' in content_type:
-            suffix = '.mp3'
         else:
-            suffix = ''
-        with tempfile.NamedTemporaryFile(delete=False, suffix=suffix) as temp_file:
-            temp_file.write(response.content)
-            return temp_file.name
 def extract_audio(file_path):
-    video = VideoFileClip(file_path)
-    audio = video.audio
-    audio_file = tempfile.NamedTemporaryFile(delete=False, suffix=".wav")
-    audio.write_audiofile(audio_file.name)
-    video.close()
-    audio.close()
-    return audio_file.name
 def transcribe_audio(file_path):
-    with open(file_path, "rb") as audio_file:
-        audio_data = audio_file.read()
-    response = model.generate_content(audio_data)
-    return response.text
 def process_media(contents, filename, url):
-    if contents:
-        content_type, content_string = contents.split(',')
-        decoded = base64.b64decode(content_string)
-        suffix = os.path.splitext(filename)[1]
-        with tempfile.NamedTemporaryFile(delete=False, suffix=suffix) as temp_file:
-            temp_file.write(decoded)
-            temp_file_path = temp_file.name
-    elif url:
-        temp_file_path = download_media(url)
-    else:
-        raise ValueError("No input provided")
     try:
         if temp_file_path.lower().endswith(('.mp4', '.avi', '.mov', '.flv', '.wmv')):
             audio_file_path = extract_audio(temp_file_path)
             transcript = transcribe_audio(audio_file_path)
             os.unlink(audio_file_path)
         else:
             transcript = transcribe_audio(temp_file_path)
-    finally:
-        os.unlink(temp_file_path)
-    return transcript
 app.layout = dbc.Container([
     html.H1("Audio/Video Transcription App", className="text-center my-4"),
@@ -142,6 +178,7 @@ def update_transcription(n_clicks, contents, filename, url):
         try:
             return process_media(contents, filename, url)
         except Exception as e:
             return f"An error occurred: {str(e)}"
     thread = threading.Thread(target=transcribe)
@@ -149,11 +186,13 @@ def update_transcription(n_clicks, contents, filename, url):
     thread.join(timeout=600)  # 10 minutes timeout
     if thread.is_alive():
         return "Transcription timed out after 10 minutes", {'display': 'none'}
     transcript = getattr(thread, 'result', "Transcription failed")
     if transcript and not transcript.startswith("An error occurred"):
         return dbc.Card([
             dbc.CardBody([
                 html.H5("Transcription Result"),
@@ -161,6 +200,7 @@ def update_transcription(n_clicks, contents, filename, url):
             ])
         ]), {'display': 'block'}
     else:
         return transcript, {'display': 'none'}
 @app.callback(
@@ -177,6 +217,6 @@ def download_transcript(n_clicks, transcription_output):
     return dict(content=transcript, filename="transcript.txt")
 if __name__ == '__main__':
-    print("Starting the Dash application...")
     app.run(debug=True, host='0.0.0.0', port=7860)
-    print("Dash application has finished running.")

 import tempfile
 import threading
 import base64
+import logging
 from urllib.parse import urlparse
 import dash
 import google.generativeai as genai
 from moviepy.editor import VideoFileClip
+# Set up logging
+logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')
+logger = logging.getLogger(__name__)
 # Initialize the Dash app
 app = dash.Dash(__name__, external_stylesheets=[dbc.themes.BOOTSTRAP])
 # Retrieve the Google API key from Hugging Face Spaces
 GOOGLE_API_KEY = os.environ.get("GOOGLE_API_KEY")
+if not GOOGLE_API_KEY:
+    logger.error("GOOGLE_API_KEY not found in environment variables")
+    raise ValueError("GOOGLE_API_KEY not set")
 genai.configure(api_key=GOOGLE_API_KEY)
 # Initialize Gemini model
         result = urlparse(url)
         return all([result.scheme, result.netloc])
     except ValueError:
+        logger.error(f"Invalid URL: {url}")
         return False
 def download_media(url):
     """Download the media at *url* into a temporary file and return its path.

     YouTube links are fetched through pytube's first progressive MP4 stream.
     Any other URL is fetched over HTTP and the file suffix is picked from the
     Content-Type header ('.mp4' for video, '.mp3' for audio, none otherwise).
     The returned file is created with delete=False, so the caller is
     responsible for removing it.

     Raises:
         ValueError: if a YouTube URL exposes no progressive MP4 stream.
         Exception: any download error is logged and re-raised unchanged.
     """
     logger.info(f"Attempting to download media from URL: {url}")
     temp_path = None
     try:
         if "youtube.com" in url or "youtu.be" in url:
             yt = YouTube(url)
             stream = yt.streams.filter(progressive=True, file_extension='mp4').first()
             if stream is None:
                 # .first() yields None when the filter matches nothing
                 raise ValueError("No progressive MP4 stream available for this video")
             # Reserve a unique path and close the handle before pytube writes
             # to it, so the file is not open twice at the same time.
             with tempfile.NamedTemporaryFile(delete=False, suffix=".mp4") as temp_file:
                 temp_path = temp_file.name
             stream.download(
                 output_path=os.path.dirname(temp_path),
                 filename=os.path.basename(temp_path),
             )
             logger.info(f"YouTube video downloaded: {temp_path}")
             return temp_path
         # A timeout keeps a stalled server from blocking the worker forever;
         # streaming avoids holding the whole payload in memory.
         with requests.get(url, stream=True, timeout=30) as response:
             # Fail fast instead of saving an HTML error page as "media"
             response.raise_for_status()
             content_type = response.headers.get('content-type', '')
             if 'video' in content_type:
                 suffix = '.mp4'
             elif 'audio' in content_type:
                 suffix = '.mp3'
             else:
                 suffix = ''
             with tempfile.NamedTemporaryFile(delete=False, suffix=suffix) as temp_file:
                 temp_path = temp_file.name
                 for chunk in response.iter_content(chunk_size=1024 * 1024):
                     temp_file.write(chunk)
         logger.info(f"Media downloaded: {temp_path}")
         return temp_path
     except Exception as e:
         logger.error(f"Error downloading media: {str(e)}")
         # Do not leave a partial download behind
         if temp_path and os.path.exists(temp_path):
             os.unlink(temp_path)
         raise
 def extract_audio(file_path):
     """Write the audio track of the video at *file_path* to a temporary WAV file.

     Returns the path of the WAV file. It is created with delete=False, so the
     caller is responsible for removing it.

     Raises:
         ValueError: if the clip exposes no audio track.
         Exception: any extraction error is logged and re-raised unchanged.
     """
     logger.info(f"Extracting audio from video: {file_path}")
     audio_path = None
     try:
         # Only the unique name is needed; close the handle right away so it is
         # not leaked and the writer can open the path itself.
         with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as audio_file:
             audio_path = audio_file.name
         video = VideoFileClip(file_path)
         audio = None
         try:
             audio = video.audio
             if audio is None:
                 raise ValueError("Video has no audio track")
             audio.write_audiofile(audio_path)
         finally:
             # Release the readers even when writing fails
             video.close()
             if audio is not None:
                 audio.close()
         logger.info(f"Audio extracted: {audio_path}")
         return audio_path
     except Exception as e:
         logger.error(f"Error extracting audio: {str(e)}")
         # Do not leave an empty or partial WAV file behind
         if audio_path and os.path.exists(audio_path):
             os.unlink(audio_path)
         raise
 def transcribe_audio(file_path):
     """Send the audio file at *file_path* to the Gemini model and return the text.

     The file is read fully into memory and sent inline, together with a
     transcription instruction, as a blob tagged with its MIME type.

     NOTE(review): inline payloads are size-limited by the API; long recordings
     probably need the file-upload route instead - confirm against the
     google-generativeai documentation.

     Raises:
         Exception: any read or API error is logged and re-raised unchanged.
     """
     import mimetypes  # local import: only this function needs it

     logger.info(f"Transcribing audio: {file_path}")
     # Explicit map for common audio suffixes, because mimetypes returns
     # platform-dependent values for some of them (e.g. 'audio/x-wav').
     known_types = {
         '.wav': 'audio/wav',
         '.mp3': 'audio/mp3',
         '.aiff': 'audio/aiff',
         '.aac': 'audio/aac',
         '.ogg': 'audio/ogg',
         '.flac': 'audio/flac',
     }
     try:
         extension = os.path.splitext(file_path)[1].lower()
         mime_type = (
             known_types.get(extension)
             or mimetypes.guess_type(file_path)[0]
             or 'application/octet-stream'
         )
         with open(file_path, "rb") as audio_file:
             audio_data = audio_file.read()
         # generate_content expects text and/or blobs carrying a MIME type, not
         # raw bytes, and needs an instruction saying what to do with the audio.
         response = model.generate_content([
             "Transcribe the following audio verbatim.",
             {"mime_type": mime_type, "data": audio_data},
         ])
         logger.info("Transcription completed successfully")
         return response.text
     except Exception as e:
         logger.error(f"Error during transcription: {str(e)}")
         raise
 def process_media(contents, filename, url):
     """Transcribe an uploaded file or a remote URL and return the transcript.

     Args:
         contents: upload payload of the form '<header>,<base64 data>', or a
             falsy value when nothing was uploaded.
         filename: original name of the upload; only its extension is used.
         url: media URL, used only when *contents* is falsy.

     Files ending in .mp4/.avi/.mov/.flv/.wmv have their audio extracted first;
     everything else is sent for transcription directly. All temporary files
     are removed whether or not processing succeeds.

     Raises:
         ValueError: if neither *contents* nor *url* is provided.
         Exception: any processing error is logged and re-raised unchanged.
     """
     logger.info("Starting media processing")
     temp_file_path = None
     audio_file_path = None
     try:
         if contents:
             # Split on the first comma only: the header precedes the payload
             _, content_string = contents.split(',', 1)
             decoded = base64.b64decode(content_string)
             # Tolerate a missing filename instead of crashing in splitext
             suffix = os.path.splitext(filename or '')[1]
             with tempfile.NamedTemporaryFile(delete=False, suffix=suffix) as temp_file:
                 temp_file.write(decoded)
                 temp_file_path = temp_file.name
             logger.info(f"File uploaded: {temp_file_path}")
         elif url:
             temp_file_path = download_media(url)
         else:
             logger.error("No input provided")
             raise ValueError("No input provided")
         if temp_file_path.lower().endswith(('.mp4', '.avi', '.mov', '.flv', '.wmv')):
             logger.info("Video file detected, extracting audio")
             audio_file_path = extract_audio(temp_file_path)
             transcript = transcribe_audio(audio_file_path)
         else:
             logger.info("Audio file detected, transcribing directly")
             transcript = transcribe_audio(temp_file_path)
         return transcript
     except Exception as e:
         logger.error(f"Error in process_media: {str(e)}")
         raise
     finally:
         # Clean up on success and on failure so temp files never accumulate
         for leftover in (audio_file_path, temp_file_path):
             if leftover and os.path.exists(leftover):
                 try:
                     os.unlink(leftover)
                 except OSError as cleanup_error:
                     logger.warning(f"Could not remove temporary file {leftover}: {cleanup_error}")
 app.layout = dbc.Container([
     html.H1("Audio/Video Transcription App", className="text-center my-4"),
         try:
             return process_media(contents, filename, url)
         except Exception as e:
+            logger.error(f"Transcription failed: {str(e)}")
             return f"An error occurred: {str(e)}"
     thread = threading.Thread(target=transcribe)
     thread.join(timeout=600)  # 10 minutes timeout
     if thread.is_alive():
+        logger.warning("Transcription timed out after 10 minutes")
         return "Transcription timed out after 10 minutes", {'display': 'none'}
     transcript = getattr(thread, 'result', "Transcription failed")
     if transcript and not transcript.startswith("An error occurred"):
+        logger.info("Transcription successful")
         return dbc.Card([
             dbc.CardBody([
                 html.H5("Transcription Result"),
             ])
         ]), {'display': 'block'}
     else:
+        logger.error(f"Transcription failed: {transcript}")
         return transcript, {'display': 'none'}
 @app.callback(
     return dict(content=transcript, filename="transcript.txt")
 if __name__ == '__main__':
     logger.info("Starting the Dash application...")
     # The server listens on every interface, so the interactive debugger must
     # not be on by default; opt in explicitly with DASH_DEBUG=1 when developing.
     debug_mode = os.environ.get("DASH_DEBUG", "").lower() in ("1", "true", "yes")
     app.run(debug=debug_mode, host='0.0.0.0', port=7860)
     logger.info("Dash application has finished running.")