Spaces:

MicroHealth
/

AV-to-transcripts

Paused

App Files Files Community

bluenevus committed on Apr 26, 2025

Commit

04933a2

verified ·

1 Parent(s): 953582f

Update app.py

Browse files

Files changed (1) hide show

app.py +66 -50

app.py CHANGED Viewed

@@ -7,7 +7,7 @@ import logging
 from urllib.parse import urlparse
 import dash
-from dash import dcc, html, Input, Output, State
 import dash_bootstrap_components as dbc
 from dash.exceptions import PreventUpdate
@@ -101,19 +101,6 @@ def extract_audio(file_path):
         logger.error(f"Error extracting audio: {str(e)}")
         raise
-def transcribe_audio(file_path):
-    logger.info(f"Transcribing audio: {file_path}")
-    try:
-        with open(file_path, "rb") as audio_file:
-            audio_data = audio_file.read()
-        response = model.generate_content(audio_data)
-        logger.info("Transcription completed successfully")
-        return response.text
-    except Exception as e:
-        logger.error(f"Error during transcription: {str(e)}")
-        raise
 def process_media(contents, filename, url):
     logger.info("Starting media processing")
     try:
@@ -134,14 +121,22 @@ def process_media(contents, filename, url):
         if temp_file_path.lower().endswith(('.mp4', '.avi', '.mov', '.flv', '.wmv')):
             logger.info("Video file detected, extracting audio")
             audio_file_path = extract_audio(temp_file_path)
-            transcript = transcribe_audio(audio_file_path)
             os.unlink(audio_file_path)
         else:
-            logger.info("Audio file detected, transcribing directly")
-            transcript = transcribe_audio(temp_file_path)
         os.unlink(temp_file_path)
-        return transcript
     except Exception as e:
         logger.error(f"Error in process_media: {str(e)}")
         raise
@@ -168,56 +163,77 @@ app.layout = dbc.Container([
                 },
                 multiple=False
             ),
             dbc.Input(id="media-url", type="text", placeholder="Enter audio/video URL or YouTube link", className="my-3"),
             dbc.Button("Transcribe", id="transcribe-button", color="primary", className="w-100 mb-3"),
             dbc.Spinner(html.Div(id="transcription-output", className="mt-3")),
             dbc.Button("Download Transcript", id="download-button", color="secondary", className="w-100 mt-3", style={'display': 'none'}),
-            dcc.Download(id="download-transcript")
         ])
     ])
 ])
 @app.callback(
     Output("transcription-output", "children"),
     Output("download-button", "style"),
     Input("transcribe-button", "n_clicks"),
     State("upload-media", "contents"),
     State("upload-media", "filename"),
     State("media-url", "value"),
     prevent_initial_call=True
 )
-def update_transcription(n_clicks, contents, filename, url):
-    if not contents and not url:
-        raise PreventUpdate
-    def transcribe():
-        try:
-            return process_media(contents, filename, url)
-        except Exception as e:
-            logger.error(f"Transcription failed: {str(e)}")
-            return f"An error occurred: {str(e)}"
-    thread = threading.Thread(target=transcribe)
-    thread.start()
-    thread.join(timeout=600)  # 10 minutes timeout
-    if thread.is_alive():
-        logger.warning("Transcription timed out after 10 minutes")
-        return "Transcription timed out after 10 minutes", {'display': 'none'}
-    transcript = getattr(thread, 'result', "Transcription failed")
-    if transcript and not transcript.startswith("An error occurred"):
-        logger.info("Transcription successful")
-        return dbc.Card([
-            dbc.CardBody([
-                html.H5("Transcription Result"),
-                html.Pre(transcript, style={"white-space": "pre-wrap", "word-wrap": "break-word"})
-            ])
-        ]), {'display': 'block'}
-    else:
-        logger.error(f"Transcription failed: {transcript}")
-        return transcript, {'display': 'none'}
 @app.callback(
     Output("download-transcript", "data"),

 from urllib.parse import urlparse
 import dash
+from dash import dcc, html, Input, Output, State, callback_context
 import dash_bootstrap_components as dbc
 from dash.exceptions import PreventUpdate
         logger.error(f"Error extracting audio: {str(e)}")
         raise
 def process_media(contents, filename, url):
     logger.info("Starting media processing")
     try:
         if temp_file_path.lower().endswith(('.mp4', '.avi', '.mov', '.flv', '.wmv')):
             logger.info("Video file detected, extracting audio")
             audio_file_path = extract_audio(temp_file_path)
+            with open(audio_file_path, "rb") as audio_file:
+                audio_data = audio_file.read()
             os.unlink(audio_file_path)
         else:
+            logger.info("Audio file detected, reading directly")
+            with open(temp_file_path, "rb") as audio_file:
+                audio_data = audio_file.read()
         os.unlink(temp_file_path)
+        # Create a Blob object from the audio data
+        audio_blob = genai.types.Blob(data=audio_data, mime_type="audio/wav")
+        response = model.generate_content(audio_blob)
+        logger.info("Transcription completed successfully")
+        return response.text
     except Exception as e:
         logger.error(f"Error in process_media: {str(e)}")
         raise
                 },
                 multiple=False
             ),
+            html.Div(id='file-info', className="mt-2"),
             dbc.Input(id="media-url", type="text", placeholder="Enter audio/video URL or YouTube link", className="my-3"),
             dbc.Button("Transcribe", id="transcribe-button", color="primary", className="w-100 mb-3"),
             dbc.Spinner(html.Div(id="transcription-output", className="mt-3")),
+            html.Div(id="progress-indicator", className="text-center mt-3"),
             dbc.Button("Download Transcript", id="download-button", color="secondary", className="w-100 mt-3", style={'display': 'none'}),
+            dcc.Download(id="download-transcript"),
+            dcc.Interval(id='progress-interval', interval=500, n_intervals=0, disabled=True)
         ])
     ])
 ])
+@app.callback(
+    Output("file-info", "children"),
+    Input("upload-media", "filename"),
+    Input("upload-media", "last_modified")
+)
+def update_file_info(filename, last_modified):
+    if filename is not None:
+        return f"File uploaded: {filename}"
+    return ""
 @app.callback(
     Output("transcription-output", "children"),
     Output("download-button", "style"),
+    Output("progress-indicator", "children"),
+    Output("progress-interval", "disabled"),
     Input("transcribe-button", "n_clicks"),
+    Input("progress-interval", "n_intervals"),
     State("upload-media", "contents"),
     State("upload-media", "filename"),
     State("media-url", "value"),
     prevent_initial_call=True
 )
+def update_transcription(n_clicks, n_intervals, contents, filename, url):
+    ctx = callback_context
+    if ctx.triggered_id == "transcribe-button":
+        if not contents and not url:
+            raise PreventUpdate
+        def transcribe():
+            try:
+                return process_media(contents, filename, url)
+            except Exception as e:
+                logger.error(f"Transcription failed: {str(e)}")
+                return f"An error occurred: {str(e)}"
+        thread = threading.Thread(target=transcribe)
+        thread.start()
+        return html.Div("Processing..."), {'display': 'none'}, "", False
+    elif ctx.triggered_id == "progress-interval":
+        dots = "." * (n_intervals % 4)
+        return html.Div("Processing" + dots), {'display': 'none'}, "", False
+    thread = threading.current_thread()
+    if hasattr(thread, 'result'):
+        transcript = thread.result
+        if transcript and not transcript.startswith("An error occurred"):
+            logger.info("Transcription successful")
+            return dbc.Card([
+                dbc.CardBody([
+                    html.H5("Transcription Result"),
+                    html.Pre(transcript, style={"white-space": "pre-wrap", "word-wrap": "break-word"})
+                ])
+            ]), {'display': 'block'}, "", True
+        else:
+            logger.error(f"Transcription failed: {transcript}")
+            return transcript, {'display': 'none'}, "", True
+    return dash.no_update, dash.no_update, dash.no_update, dash.no_update
 @app.callback(
     Output("download-transcript", "data"),