Spaces:

JunyiAcademy
/

vaitor2

Sleeping

App Files Community

youngtsai committed on Jan 19, 2024

Commit

a41dfa9

1 Parent(s): a11ae70

transcript_html

Browse files

Files changed (1) hide show

app.py +20 -3

app.py CHANGED Viewed

@@ -69,20 +69,35 @@ def process_youtube_link(link):
     for entry in transcript:
         start_time = format_seconds_to_time(entry['start'])
         end_time = format_seconds_to_time(entry['start'] + entry['duration'])
         line = {
             "start_time": start_time,
             "end_time": end_time,
             "text": entry['text'],
-            "screenshot": get_screenshot_from_video(link, entry['start'])
         }
         formatted_transcript.append(line)
     # 确保返回与 UI 组件预期匹配的输出
     return questions[0] if len(questions) > 0 else "", \
             questions[1] if len(questions) > 1 else "", \
             questions[2] if len(questions) > 2 else "", \
             df_summarise, \
-            formatted_transcript
 def get_screenshot_from_video(video_link, start_time):
     # 实现从视频中提取帧的逻辑
@@ -209,6 +224,8 @@ with gr.Blocks() as demo:
             send_button = gr.Button("Send")
         with gr.Column():
             with gr.Tab("資料本文"):
                 df_string_output = gr.Textbox()
             with gr.Tab("資料摘要"):
@@ -236,7 +253,7 @@ with gr.Blocks() as demo:
     file_upload.change(process_file, inputs=file_upload, outputs=[btn_1, btn_2, btn_3, df_summarise, df_string_output])
     # 当输入 YouTube 链接时触发
-    youtube_link.change(process_youtube_link, inputs=youtube_link, outputs=[btn_1, btn_2, btn_3, df_summarise, df_string_output])
     # 当输入网页链接时触发
     web_link.change(process_web_link, inputs=web_link, outputs=[btn_1, btn_2, btn_3, df_summarise, df_string_output])

     for entry in transcript:
         start_time = format_seconds_to_time(entry['start'])
         end_time = format_seconds_to_time(entry['start'] + entry['duration'])
+        embed_url = get_embedded_youtube_link(video_id, entry['start'])
         line = {
             "start_time": start_time,
             "end_time": end_time,
             "text": entry['text'],
+            "embed_url": embed_url
         }
         formatted_transcript.append(line)
+    html_content = format_transcript_to_html(formatted_transcript)
     # 确保返回与 UI 组件预期匹配的输出
     return questions[0] if len(questions) > 0 else "", \
             questions[1] if len(questions) > 1 else "", \
             questions[2] if len(questions) > 2 else "", \
             df_summarise, \
+            html_content
def format_transcript_to_html(formatted_transcript):
    """Render transcript entries as a single HTML fragment.

    Each entry produces a heading with its time range, a paragraph with the
    caption text, and an embedded player iframe.

    Args:
        formatted_transcript: Iterable of mappings, each providing the keys
            ``start_time``, ``end_time``, ``text`` and ``embed_url``.

    Returns:
        The concatenated HTML for all entries; an empty string when there
        are no entries.
    """
    # Local import so this block does not rely on the file's import section.
    from html import escape

    pieces = []
    for entry in formatted_transcript:
        # Every value is escaped before interpolation: caption text comes
        # from an external transcript and must not be able to inject markup.
        # Escaping the URL also turns "&" into "&amp;", which is the correct
        # spelling inside an HTML attribute, and neutralises "'" so the value
        # cannot break out of the single-quoted src attribute.
        start_label = escape(str(entry['start_time']))
        end_label = escape(str(entry['end_time']))
        caption = escape(str(entry['text']))
        player_src = escape(str(entry['embed_url']))

        pieces.append(f"<h3>{start_label} - {end_label}</h3>")
        pieces.append(f"<p>{caption}</p>")
        pieces.append(
            f"<iframe width='560' height='315' src='{player_src}' "
            "frameborder='0' allowfullscreen></iframe><br><br>"
        )
    # Join once instead of growing a string with repeated +=.
    return "".join(pieces)
def get_embedded_youtube_link(video_id, start_time):
    """Build a YouTube embed URL that starts playback at a given offset.

    Args:
        video_id: The YouTube video identifier placed in the URL path.
        start_time: Offset in seconds; may be an int, a float, or a numeric
            string. Fractional parts are truncated.

    Returns:
        An ``https://www.youtube.com/embed/...`` URL with ``start`` and
        ``autoplay=1`` query parameters.

    Raises:
        TypeError, ValueError: If ``start_time`` cannot be read as a number.
    """
    # The embed player's `start` parameter takes whole seconds, while the
    # caller may pass a fractional offset (e.g. 12.34), so truncate it.
    # Negative offsets are clamped to the beginning of the video.
    start_seconds = max(0, int(float(start_time)))
    return f"https://www.youtube.com/embed/{video_id}?start={start_seconds}&autoplay=1"
 def get_screenshot_from_video(video_link, start_time):
     # 实现从视频中提取帧的逻辑
             send_button = gr.Button("Send")
         with gr.Column():
+            with gr.Tab("YouTube Transcript and Video"):
+                transcript_html = gr.HTML(label="YouTube Transcript and Video")
             with gr.Tab("資料本文"):
                 df_string_output = gr.Textbox()
             with gr.Tab("資料摘要"):
     file_upload.change(process_file, inputs=file_upload, outputs=[btn_1, btn_2, btn_3, df_summarise, df_string_output])
     # 当输入 YouTube 链接时触发
+    youtube_link.change(process_youtube_link, inputs=youtube_link, outputs=[btn_1, btn_2, btn_3, df_summarise, transcript_html])
     # 当输入网页链接时触发
     web_link.change(process_web_link, inputs=web_link, outputs=[btn_1, btn_2, btn_3, df_summarise, df_string_output])