lgsantini1 commited on
Commit
8f41d61
·
verified ·
1 Parent(s): 7517ea5

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +28 -33
app.py CHANGED
@@ -1,38 +1,33 @@
1
- import re
2
  import gradio as gr
3
- from youtube_transcript_api import YouTubeTranscriptApi
 
 
 
 
 
 
 
4
 
5
- def extract_video_id(youtube_url):
6
- # Regex para extrair o ID do vídeo da URL do YouTube
7
- match = re.search(r'(?:youtu\.be\/|(?:www\.)?youtube\.com\/(?:watch\?v=|embed\/|v\/|.+\?v=))([^&]{11})', youtube_url)
8
- return match.group(1) if match else None
9
 
10
- def get_transcript(video_id, language="en"):
11
  try:
12
- transcript = YouTubeTranscriptApi.get_transcript(video_id, languages=[language])
13
- return "\n".join([f"{t['start']}: {t['text']}" for t in transcript])
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
14
  except Exception as e:
15
- return f"Erro ao obter transcrição: {str(e)}"
16
-
17
- # Função que combina a extração do ID e a obtenção da transcrição
18
- def gradio_interface(youtube_url, language):
19
- video_id = extract_video_id(youtube_url)
20
- if not video_id:
21
- return "Erro: URL inválida. Por favor, insira um link válido do YouTube."
22
-
23
- return get_transcript(video_id, language)
24
-
25
- # Criação da interface Gradio
26
- iface = gr.Interface(
27
- fn=gradio_interface,
28
- inputs=[
29
- gr.Textbox(label="URL do Vídeo (YouTube)", placeholder="Ex: https://www.youtube.com/watch?v=tl1jHm0qC_4"),
30
- gr.Dropdown(label="Idioma", choices=["en", "pt", "es", "fr"], value="en")
31
- ],
32
- outputs="text",
33
- title="Obter Transcrição de Vídeos do YouTube",
34
- description="Insira a URL de um vídeo do YouTube e selecione o idioma da transcrição."
35
- )
36
-
37
- # Execução da interface Gradio
38
- iface.launch(share=True)
 
 
1
  import gradio as gr
2
+ from langchain_community.document_loaders import YoutubeLoader
3
+
4
+ from langchain_core.prompts import ChatPromptTemplate
5
+ from youtube_transcript_api import NoTranscriptFound
6
+ from pytube.exceptions import PytubeError
7
+
8
+ def load_youtube_video_info(url):
9
+ # Initialize YouTube loader with preferred language as Portuguese
10
 
 
 
 
 
11
 
 
12
  try:
13
+ loader = YoutubeLoader.from_youtube_url(url, add_video_info=True, language="pt")
14
+
15
+ # Load the video information and transcript
16
+ result = loader.load()
17
+
18
+ if result:
19
+ # Retrieve metadata information
20
+ author = result[0].metadata.get('author', 'Unknown Author')
21
+ length = result[0].metadata.get('length', 'Unknown Length')
22
+ # Check if transcript is available
23
+ transcript = result[0].page_content if hasattr(result[0], 'page_content') else "No transcript available."
24
+
25
+ info = "No result found."
26
+ except NoTranscriptFound:
27
+ info = "Transcript not found for this video."
28
+ except PytubeError as e:
29
+ info = f"Error loading video information: {str(e)}"
30
  except Exception as e:
31
+ info = f"An unexpected error occurred: {str(e)}"
32
+
33
+ return info