Spaces:
Running
Running
YouTubeTranscriptApi
Browse files
- app.py +5 -1
- requirements.txt +2 -1
app.py
CHANGED
|
@@ -6,6 +6,8 @@ from docx import Document
|
|
| 6 |
import os
|
| 7 |
from openai import OpenAI
|
| 8 |
import json
|
|
|
|
|
|
|
| 9 |
|
| 10 |
OPEN_AI_KEY = os.getenv("OPEN_AI_KEY")
|
| 11 |
client = OpenAI(api_key=OPEN_AI_KEY)
|
|
@@ -50,7 +52,9 @@ def docx_to_text(file):
|
|
| 50 |
def process_youtube_link(link):
|
| 51 |
# 使用 YouTube API 获取逐字稿
|
| 52 |
# 假设您已经获取了 YouTube 视频的逐字稿并存储在变量 `transcript` 中
|
| 53 |
-
|
|
|
|
|
|
|
| 54 |
|
| 55 |
# 基于逐字稿生成其他所需的输出
|
| 56 |
questions = generate_questions(transcript)
|
|
|
|
| 6 |
import os
|
| 7 |
from openai import OpenAI
|
| 8 |
import json
|
| 9 |
+
from youtube_transcript_api import YouTubeTranscriptApi
|
| 10 |
+
|
| 11 |
|
| 12 |
OPEN_AI_KEY = os.getenv("OPEN_AI_KEY")
|
| 13 |
client = OpenAI(api_key=OPEN_AI_KEY)
|
|
|
|
| 52 |
def process_youtube_link(link):
|
| 53 |
# 使用 YouTube API 获取逐字稿
|
| 54 |
# 假设您已经获取了 YouTube 视频的逐字稿并存储在变量 `transcript` 中
|
| 55 |
+
video_id = link.split("=")[-1]
|
| 56 |
+
transcript = YouTubeTranscriptApi.get_transcript(video_id, languages=['zh-TW'])
|
| 57 |
+
|
| 58 |
|
| 59 |
# 基于逐字稿生成其他所需的输出
|
| 60 |
questions = generate_questions(transcript)
|
requirements.txt
CHANGED
|
@@ -3,4 +3,5 @@ pandas
|
|
| 3 |
openai>=1.0.0
|
| 4 |
requests
|
| 5 |
beautifulsoup4
|
| 6 |
-
python-docx
|
|
|
|
|
|
| 3 |
openai>=1.0.0
|
| 4 |
requests
|
| 5 |
beautifulsoup4
|
| 6 |
+
python-docx
|
| 7 |
+
youtube-transcript-api
|