Spaces:

Sayiqa
/

deployment

Sleeping

App Files Community

Sayiqa committed on Dec 30, 2024

Commit

985d66e

verified ·

1 Parent(s): c421f22

Update app.py

Browse files

Files changed (1) hide show

app.py +30 -25

app.py CHANGED Viewed

@@ -391,38 +391,43 @@ def process_youtube_video(url="", keywords=""):
         if not video_id:
             return thumbnail, "Invalid YouTube URL", sentiment_label, recommendations
-        video_id = extract_video_id(url)
-        if not video_id:
-            return thumbnail, "Invalid YouTube URL", sentiment_label, recommendations
-        # Set thumbnail
         thumbnail = f"https://img.youtube.com/vi/{video_id}/maxresdefault.jpg"
         try:
-            # Get transcript
-            transcript_list = YouTubeTranscriptApi.list_transcripts(video_id)
-            transcript = None
-            # Try different transcript options
-            for lang in ['en', 'en-US', 'a.en']:
                 try:
-                    transcript = transcript_list.find_transcript([lang])
-                    break
                 except:
-                    continue
-            if not transcript:
-                transcript = transcript_list.find_generated_transcript(['en'])
-            # Get transcript text
-            text = " ".join([t['text'] for t in transcript.fetch()])
-            # Clean text
             cleaned_text = re.sub(r'[^\w\s.]', '', text)
             cleaned_text = ' '.join(cleaned_text.split())
             # Sentiment Analysis
-            blob = TextBlob(cleaned_text[:2000])  # Analyze first 2000 chars
             polarity = blob.sentiment.polarity
             subjectivity = blob.sentiment.subjectivity
@@ -436,10 +441,9 @@ def process_youtube_video(url="", keywords=""):
             model = genai.GenerativeModel("gemini-pro")
             summary = model.generate_content(f"Summarize this content: {cleaned_text[:4000]}").text
-        except (TranscriptsDisabled, NoTranscriptFound):
-            return thumbnail, "⚠️ No English subtitles available", "N/A", recommendations
         except Exception as e:
-            return thumbnail, f"⚠️ Error: {str(e)}", "N/A", recommendations
         # Get recommendations
         if keywords.strip():
@@ -448,6 +452,7 @@ def process_youtube_video(url="", keywords=""):
         return thumbnail, summary, sentiment_label, recommendations
     except Exception as e:
         return None, f"Error: {str(e)}", "N/A", ""

         if not video_id:
             return thumbnail, "Invalid YouTube URL", sentiment_label, recommendations
         thumbnail = f"https://img.youtube.com/vi/{video_id}/maxresdefault.jpg"
         try:
+            # Method 1: Direct transcript fetch
+            try:
+                transcript = YouTubeTranscriptApi.get_transcript(video_id, languages=['en'])
+                text = " ".join([t['text'] for t in transcript])
+            except:
+                # Method 2: Try list_transcripts
                 try:
+                    transcript_list = YouTubeTranscriptApi.list_transcripts(video_id)
+                    # Try multiple language variants
+                    for lang_code in ['en', 'en-US', 'en-GB', 'a.en']:
+                        try:
+                            transcript = transcript_list.find_transcript([lang_code])
+                            text = " ".join([t['text'] for t in transcript.fetch()])
+                            break
+                        except:
+                            continue
+                    # If no English transcript found, try auto-generated
+                    if 'text' not in locals():
+                        transcript = transcript_list.find_generated_transcript(['en'])
+                        text = " ".join([t['text'] for t in transcript.fetch()])
                 except:
+                    # Method 3: Try translation
+                    available_transcripts = transcript_list.find_manually_created_transcript()
+                    translated = available_transcripts.translate('en')
+                    text = " ".join([t['text'] for t in translated.fetch()])
+            # Clean and process text
             cleaned_text = re.sub(r'[^\w\s.]', '', text)
             cleaned_text = ' '.join(cleaned_text.split())
             # Sentiment Analysis
+            blob = TextBlob(cleaned_text[:2000])
             polarity = blob.sentiment.polarity
             subjectivity = blob.sentiment.subjectivity
             model = genai.GenerativeModel("gemini-pro")
             summary = model.generate_content(f"Summarize this content: {cleaned_text[:4000]}").text
         except Exception as e:
+            print(f"Debug - Transcript Error: {str(e)}")  # Debug logging
+            return thumbnail, f"⚠️ Unable to process video: {str(e)}", "N/A", recommendations
         # Get recommendations
         if keywords.strip():
         return thumbnail, summary, sentiment_label, recommendations
     except Exception as e:
+        print(f"Debug - Main Error: {str(e)}")  # Debug logging
         return None, f"Error: {str(e)}", "N/A", ""