mangubee Claude committed on
Commit
a170083
·
1 Parent(s): c9e941b

fix: youtube transcript API and missing datasets dependency

Browse files

- Changed YouTubeTranscriptApi.get_transcript to .fetch (API changed)
- Added datasets>=4.4.0 to pyproject.toml (was missing)

Co-Authored-By: Claude <noreply@anthropic.com>

Files changed (2) hide show
  1. pyproject.toml +1 -0
  2. src/tools/youtube.py +1 -1
pyproject.toml CHANGED
@@ -36,6 +36,7 @@ dependencies = [
36
  "gradio[oauth]>=5.0.0",
37
  "pandas>=2.2.0",
38
  "tenacity>=9.1.2",
 
39
  "groq>=1.0.0",
40
  ]
41
 
 
36
  "gradio[oauth]>=5.0.0",
37
  "pandas>=2.2.0",
38
  "tenacity>=9.1.2",
39
+ "datasets>=4.4.0",
40
  "groq>=1.0.0",
41
  ]
42
 
src/tools/youtube.py CHANGED
@@ -111,7 +111,7 @@ def get_youtube_transcript(video_id: str) -> Dict[str, Any]:
111
  logger.info(f"Fetching transcript for video: {video_id}")
112
 
113
  # Get transcript (auto-detect language, prefer English)
114
- transcript_list = YouTubeTranscriptApi.get_transcript(
115
  video_id,
116
  languages=['en', 'en-US', 'en-GB']
117
  )
 
111
  logger.info(f"Fetching transcript for video: {video_id}")
112
 
113
  # Get transcript (auto-detect language, prefer English)
114
+ transcript_list = YouTubeTranscriptApi.fetch(
115
  video_id,
116
  languages=['en', 'en-US', 'en-GB']
117
  )