Spaces:

GoodML
/

dishDecode

Sleeping

GoodML committed on Nov 26, 2024

Commit

7844e16

verified ·

1 Parent(s): 58418df

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -96,25 +96,26 @@ def process_youtube():
         return jsonify({"error": "No YouTube URL provided"}), 400
     try:
-        # Extract the YouTube video ID from the URL
-        video_id = youtube_url.split("=")[1]
-        transcript = ""
-        try:
-            # Fetch the transcript for the video using YouTubeTranscriptApi
-            transcript_data = YouTubeTranscriptApi.get_transcript(video_id)
-            # Concatenate the text from each segment into a single transcript
-            transcript = " ".join([segment['text'] for segment in transcript_data])
-        except Exception as e:
-            print(f"Error fetching transcript for video ID {video_id}: {e}")
-        if not transcript:
-            return jsonify({"error": f"Unable to fetch transcript from YouTube: {transcript}"}), 500
         # Send the transcript to the Gemini API for structured data
         structured_data = query_gemini_api(transcript)
         # Return the structured data
         return jsonify(structured_data)

         return jsonify({"error": "No YouTube URL provided"}), 400
     try:
+    """
+    Fetches the transcript of a YouTube video using the YouTube Transcript API.
+    """
+        # Extract the video ID from the YouTube URL
+        video_id = youtube_url.split("v=")[-1].split("&")[0]
+        # Fetch the transcript for the given video ID
+        transcript_data = YouTubeTranscriptApi.get_transcript(video_id)
+        # Print transcript to console
+        print(f"Transcript for video ID {video_id}:")
+        transcript = " ".join([segment['text'] for segment in transcript_data])
         # Send the transcript to the Gemini API for structured data
         structured_data = query_gemini_api(transcript)
         # Return the structured data
         return jsonify(structured_data)