Spaces:

samir72
/

AudioChatTranscriber

Running

App Files Files Community

samir72 committed on Sep 19, 2025

Commit

ec7331c

1 Parent(s): 9865a29

Error handling

Browse files

Files changed (3) hide show

Youtubetranscription_summarizer.py +9 -3
__pycache__/Youtubetranscription_summarizer.cpython-313.pyc +0 -0
app.py +25 -13

Youtubetranscription_summarizer.py CHANGED Viewed

@@ -25,14 +25,17 @@ def nslookup(domain):
         # Perform DNS lookup for the domain
         addresses = socket.getaddrinfo(domain, None)
         print(f"DNS lookup succesfull for {domain}:")
         # for addr in addresses:
         #     # Extract IP address from the result
         #     ip = addr[4][0]
         #     print(f"IP Address: {ip}")
     except socket.gaierror as e:
         print(f"DNS lookup failed for {domain}: {e}")
     except Exception as e:
         print(f"An unexpected error occurred: {e}")
 def extract_domain(url):
     # Regular expression to match the domain name
@@ -146,12 +149,14 @@ def download_youtube_audio_wav16k_api(
         with yt_dlp.YoutubeDL(ydl_opts) as ydl:
             ydl.extract_info(youtube_url, download=True)
     except Exception as e:
-        raise YTDLPError(f"yt-dlp API failed: {e}") from e
     # Locate the produced WAV (pre-downsampled)
     pre_wavs = list(work_dir.glob("*.wav"))
     if not pre_wavs:
-        raise YTDLPError("yt-dlp completed but no WAV was found.")
     pre_wav = max(pre_wavs, key=lambda p: p.stat().st_mtime)
     # Second stage: force 16 kHz mono via ffmpeg
@@ -171,7 +176,8 @@ def download_youtube_audio_wav16k_api(
             text=True,
         )
     except subprocess.CalledProcessError as e:
-        raise YTDLPError(f"ffmpeg failed to resample: {e.stderr or e.stdout}") from e
     # Clean up intermediates if desired
     if not keep_intermediate:

         # Perform DNS lookup for the domain
         addresses = socket.getaddrinfo(domain, None)
         print(f"DNS lookup succesfull for {domain}:")
+        return True
         # for addr in addresses:
         #     # Extract IP address from the result
         #     ip = addr[4][0]
         #     print(f"IP Address: {ip}")
     except socket.gaierror as e:
         print(f"DNS lookup failed for {domain}: {e}")
+        return False
     except Exception as e:
         print(f"An unexpected error occurred: {e}")
+        return False
 def extract_domain(url):
     # Regular expression to match the domain name
         with yt_dlp.YoutubeDL(ydl_opts) as ydl:
             ydl.extract_info(youtube_url, download=True)
     except Exception as e:
+        #raise YTDLPError(f"yt-dlp API failed: {e}") from e
+        return f"yt-dlp API failed: {e}"
     # Locate the produced WAV (pre-downsampled)
     pre_wavs = list(work_dir.glob("*.wav"))
     if not pre_wavs:
+        #raise YTDLPError("yt-dlp completed but no WAV was found.")
+        return "yt-dlp completed but no WAV was found."
     pre_wav = max(pre_wavs, key=lambda p: p.stat().st_mtime)
     # Second stage: force 16 kHz mono via ffmpeg
             text=True,
         )
     except subprocess.CalledProcessError as e:
+        #raise YTDLPError(f"ffmpeg failed to resample: {e.stderr or e.stdout}") from e
+        return f"ffmpeg failed to resample: {e.stderr or e.stdout}"
     # Clean up intermediates if desired
     if not keep_intermediate:

__pycache__/Youtubetranscription_summarizer.cpython-313.pyc CHANGED Viewed

Binary files a/__pycache__/Youtubetranscription_summarizer.cpython-313.pyc and b/__pycache__/Youtubetranscription_summarizer.cpython-313.pyc differ

app.py CHANGED Viewed

@@ -13,7 +13,7 @@ import re
 # --- LLM call (Azure OpenAI with API key) -----------------------------------
-def summarize_input(audio_b64: str = None, text_input: str = None, sys_prompt: str = None, user_prompt: str = None) -> str:
     """
     Calls Azure OpenAI Chat Completions with audio input (base64 mp3) or text input, or both.
     """
@@ -82,7 +82,9 @@ def summarize_input(audio_b64: str = None, text_input: str = None, sys_prompt: s
                 {"role": "user", "content": content},
             ],
         )
-        print(f"Azure API call at {datetime.now()}: prompt_length={len(user_prompt or '')}, "
               f"audio_size={len(audio_b64 or '')}, text_input_size={len(json_text or '')}")
         return response.choices[0].message.content
@@ -132,7 +134,11 @@ def process_audio(upload_path, record_path, url, sys_prompt, user_prompt):
     tmp_to_cleanup = []
     audio_b64 = None
     text_input = None
     try:
         audio_path = None
         if upload_path:
             audio_path = upload_path
@@ -142,23 +148,29 @@ def process_audio(upload_path, record_path, url, sys_prompt, user_prompt):
             # Check dns resolution of the url domain
             domain = Youtubetranscription_summarizer.extract_domain(url)
             if domain:
-                Youtubetranscription_summarizer.nslookup(domain)  # Check DNS resolution of the domain
-            #Check if it's a youtube url
-            CheckURL = re.search(r"Youtube", url, re.IGNORECASE)
-            if CheckURL:
-                # Get the transcription from youtube
-                text_input = Youtubetranscription_summarizer.main(url.strip()) # Youtube files are transcribed and summarized
-                tmp_to_cleanup.append(text_input)
-            else:
-                audio_path = download_to_temp_mp3(url.strip())
-                tmp_to_cleanup.append(audio_path)
         if not audio_path and text_input is None:
             return "Please provide content via upload, recording, or URL."
         # If we have an audio file, encode it
         if audio_path:
             audio_b64 = encode_audio_from_path(audio_path)
-        return summarize_input(audio_b64, text_input, sys_prompt, user_prompt)
     except Exception as e:
         return print(f"Error processing audio at {datetime.now()}: prompt_length={len(user_prompt)}, audio_path={audio_path}: {str(e)}")

 # --- LLM call (Azure OpenAI with API key) -----------------------------------
+def summarize_input(audio_b64: str = None, text_input: str = None, sys_prompt: str = None, user_prompt: str = None, Starttime: datetime = None) -> str:
     """
     Calls Azure OpenAI Chat Completions with audio input (base64 mp3) or text input, or both.
     """
                 {"role": "user", "content": content},
             ],
         )
+        Enddate = datetime.now()
+        Callduration = Enddate - Starttime[0]
+        print(f"Azure API call with a duration of {Callduration}: prompt_length={len(user_prompt or '')}, "
               f"audio_size={len(audio_b64 or '')}, text_input_size={len(json_text or '')}")
         return response.choices[0].message.content
     tmp_to_cleanup = []
     audio_b64 = None
     text_input = None
+    domaincheck = None
     try:
+        # Capture start time for logging
+        Starttime = datetime.now(),
+        print(f"Azure API call starts at {datetime.now()}"),
         audio_path = None
         if upload_path:
             audio_path = upload_path
             # Check dns resolution of the url domain
             domain = Youtubetranscription_summarizer.extract_domain(url)
             if domain:
+                domaincheck = Youtubetranscription_summarizer.nslookup(domain)  # Check DNS resolution of the domain
+            else:
+                return "Invalid URL format."
+            if domaincheck:
+                # Check if the url is a youtube link
+                CheckURL = re.search(r"Youtube", url, re.IGNORECASE)
+                if CheckURL:
+                    # Get the transcription from youtube
+                    text_input = Youtubetranscription_summarizer.main(url.strip()) # Youtube files are transcribed and summarized
+                    tmp_to_cleanup.append(text_input)
+                else:
+                    audio_path = download_to_temp_mp3(url.strip())
+                    tmp_to_cleanup.append(audio_path)
+            else:
+                return f"DNS lookup failed for {domain}"
         if not audio_path and text_input is None:
             return "Please provide content via upload, recording, or URL."
         # If we have an audio file, encode it
         if audio_path:
             audio_b64 = encode_audio_from_path(audio_path)
+        return summarize_input(audio_b64, text_input, sys_prompt, user_prompt, Starttime)
     except Exception as e:
         return print(f"Error processing audio at {datetime.now()}: prompt_length={len(user_prompt)}, audio_path={audio_path}: {str(e)}")