Final_Assignment_Template

Sleeping

Luigi D'Addona committed on Jun 27, 2025

Commit

ffe7776

1 Parent(s): 1a64e3b

il tool get_youtube_transcript() ora restituisce un dict con i campi "transcript" e "metadata"

Files changed (1) hide show

tools.py CHANGED Viewed

@@ -318,13 +318,27 @@ def arxiv_search(query: str) -> str:
 @tool
-def get_youtube_transcript(url: str) -> str:
-    """
-    Fetches the transcript from a YouTube video URL and returns it as plain text.
     """
-    loader = YoutubeLoader.from_youtube_url(url, add_video_info=True)
-    docs = loader.load()
-    # Combine all transcript chunks into a single string
-    transcript = "\n".join(doc.page_content for doc in docs)
-    return transcript

 @tool
+def get_youtube_transcript(url: str) -> dict:
+    """Fetches the transcript from a YouTube video URL.
+    Args:
+        url: The URL of the YouTube video.
+    Returns:
+        A dictionary containing the transcript and metadata.
+        The dictionary will have keys "transcript" (string, the video transcript or an error message) and "metadata" (dictionary, containing video title and other information, if available, otherwise empty).
     """
+    try:
+        loader = YoutubeLoader.from_youtube_url(url, add_video_info=True)
+        docs = loader.load()
+        # Combine all transcript chunks into a single string
+        transcript = "\n".join(doc.page_content for doc in docs)
+        metadata = docs[0].metadata if docs else {}
+        return {"transcript": transcript, "metadata": metadata}
+    except Exception as e:
+        if "Could not retrieve transcript" in str(e):
+            return {"transcript": "No transcript available for this video.", "metadata": {}}
+        else:
+            return {"transcript": f"Error fetching transcript: {e}", "metadata": {}}