Video_Convergence_test

Sleeping

App Files Files Community

EU-IA committed on Aug 28, 2025

Commit

7d6ac50

verified ·

1 Parent(s): 66617c2

Update app.py

Browse files

Files changed (1) hide show

app.py +36 -30

app.py CHANGED Viewed

@@ -1,4 +1,4 @@
-#--- START OF FILE app.py ---
 import gradio as gr
 import cv2
@@ -8,7 +8,7 @@ import matplotlib.pyplot as plt
 from PIL import Image
 import imagehash
 import torch
-from scipy.stats import pearsonr
 import os
 # --- MÓDULO DE INICIALIZAÇÃO ---
@@ -36,9 +36,8 @@ except Exception as e:
 # --- FUNÇÕES DE ANÁLISE ---
-# --- MODIFICADO ---
-# Agora aceita start_frame e end_frame para analisar apenas um trecho.
 def analisar_fidelidade(video_path, start_frame=0, end_frame=0):
     cap = cv2.VideoCapture(video_path)
     if not cap.isOpened():
         raise gr.Error("Não foi possível abrir o arquivo de vídeo.")
@@ -47,7 +46,7 @@ def analisar_fidelidade(video_path, start_frame=0, end_frame=0):
     fps = cap.get(cv2.CAP_PROP_FPS) or 30
     total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
-    # Valida e ajusta os frames de início e fim
     process_full_video = (start_frame == 0 and end_frame == 0) or (start_frame >= end_frame)
     if process_full_video:
@@ -160,15 +159,13 @@ def executar_teste_semantico(phash_distances, descriptions_text):
     # (Função como definida anteriormente)
     return None, "Função ainda não implementada completamente no template"
-# --- NOVA FUNÇÃO ---
-# Extrai frames de um trecho e os une em uma única imagem.
 def extrair_e_visualizar_frames(video_path, start_frame, end_frame):
     if not video_path or start_frame >= end_frame:
         return None
     cap = cv2.VideoCapture(video_path)
-    if not cap.isOpened():
-        return None
     total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
     start_frame = max(0, start_frame)
@@ -176,27 +173,41 @@ def extrair_e_visualizar_frames(video_path, start_frame, end_frame):
     cap.set(cv2.CAP_PROP_POS_FRAMES, start_frame)
-    extracted_frames = []
     for i in range(start_frame, end_frame):
         ret, frame = cap.read()
-        if not ret:
-            break
-        # Adiciona texto com o número do frame
         frame_num_text = f"Frame: {i}"
         cv2.putText(frame, frame_num_text, (10, 30), cv2.FONT_HERSHEY_SIMPLEX, 1, (0, 0, 255), 2, cv2.LINE_AA)
-        extracted_frames.append(cv2.cvtColor(frame, cv2.COLOR_BGR2RGB))
     cap.release()
-    if not extracted_frames:
-        return None
-    # Une os frames horizontalmente
-    combined_image = np.hstack(extracted_frames)
-    # Salva a imagem combinada em um arquivo temporário
     pil_img = Image.fromarray(combined_image)
-    path = "frames_extraidos.png"
     pil_img.save(path)
     return path
@@ -246,14 +257,13 @@ def gerar_grafico_foco(ssim_global, ssim_foco, jitter, num_frames, fps):
     return plot_to_file(fig, "foco")
-# --- FUNÇÃO DE CALLBACK PRINCIPAL (MODIFICADA) ---
 def run_full_analysis(video_path, descriptions_text, start_frame, end_frame, progress=gr.Progress()):
     if video_path is None: raise gr.Error("Por favor, faça o upload de um vídeo.")
-    # Converte para inteiros
     start_frame, end_frame = int(start_frame), int(end_frame)
-    progress(0, desc="Extraindo frames para visualização...")
     frames_imagem_path = extrair_e_visualizar_frames(video_path, start_frame, end_frame)
     progress(0.1, desc="Analisando fidelidade do trecho...")
@@ -283,10 +293,9 @@ def run_full_analysis(video_path, descriptions_text, start_frame, end_frame, pro
         if error_msg: gr.Warning(error_msg)
     progress(1.0, desc="Análise completa!")
-    # --- MODIFICADO --- Retorna o caminho da nova imagem de frames também
     return frames_imagem_path, fidelidade_plot_path, cor_plot_path, foco_plot_path, semantico_path, anomalias_plot_path
-# --- INTERFACE GRADIO (MODIFICADA) ---
 with gr.Blocks(theme=gr.themes.Soft()) as demo:
     gr.Markdown("# Suíte de Validação Completa para Geração de Vídeo (ADUC-SDR)")
     with gr.Row():
@@ -294,7 +303,6 @@ with gr.Blocks(theme=gr.themes.Soft()) as demo:
             video_input = gr.Video(label="1. Upload do vídeo")
             descriptions_input = gr.Textbox(lines=5, label="3. Descrições (Opcional)", placeholder="Uma descrição por cena para o teste de inteligência...")
-            # --- NOVOS COMPONENTES ---
             with gr.Row():
                 start_frame_input = gr.Number(label="Frame Inicial", value=0, precision=0, info="Deixe 0 e 0 para analisar o vídeo inteiro.")
                 end_frame_input = gr.Number(label="Frame Final", value=0, precision=0, info="Ex: 88 e 94 para analisar esse trecho.")
@@ -302,9 +310,8 @@ with gr.Blocks(theme=gr.themes.Soft()) as demo:
             analyze_button = gr.Button("4. Executar Análise Completa", variant="primary")
     with gr.Tabs():
-        # --- NOVA ABA ---
         with gr.TabItem("Frames Extraídos"):
-            extracted_frames_img = gr.Image(label="Visualização dos Frames Lado a Lado")
         with gr.TabItem("1. Fidelidade e Coerência"):
             plot_fidelidade = gr.Image(label="Gráfico de Análise de Fidelidade (SSIM e pHash)")
         with gr.TabItem("2. Cor e Iluminação"):
@@ -316,11 +323,10 @@ with gr.Blocks(theme=gr.themes.Soft()) as demo:
         with gr.TabItem("5. Inteligência Adaptativa"):
             plot_semantico = gr.Image(label="Gráfico de Estresse Semântico")
-    # --- MODIFICADO --- Atualiza inputs e outputs do botão
     analyze_button.click(
         fn=run_full_analysis,
         inputs=[video_input, descriptions_input, start_frame_input, end_frame_input],
-        outputs=[extracted_frames_img, plot_fidelidade, plot_cor, plot_foco, plot_semantico, plot_anomalias]
     )
 if __name__ == "__main__":

+# --- START OF FILE app.py ---
 import gradio as gr
 import cv2
 from PIL import Image
 import imagehash
 import torch
+import collections # Adicionado para a nova lógica de visualização
 import os
 # --- MÓDULO DE INICIALIZAÇÃO ---
 # --- FUNÇÕES DE ANÁLISE ---
 def analisar_fidelidade(video_path, start_frame=0, end_frame=0):
+    """Lê um trecho do vídeo e calcula as métricas de fidelidade (SSIM, pHash)."""
     cap = cv2.VideoCapture(video_path)
     if not cap.isOpened():
         raise gr.Error("Não foi possível abrir o arquivo de vídeo.")
     fps = cap.get(cv2.CAP_PROP_FPS) or 30
     total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
+    # Valida e ajusta os frames de início e fim. Se inválido, analisa o vídeo todo.
     process_full_video = (start_frame == 0 and end_frame == 0) or (start_frame >= end_frame)
     if process_full_video:
     # (Função como definida anteriormente)
     return None, "Função ainda não implementada completamente no template"
 def extrair_e_visualizar_frames(video_path, start_frame, end_frame):
+    """Extrai frames de um trecho e os organiza em uma grade alinhada a múltiplos de 8."""
     if not video_path or start_frame >= end_frame:
         return None
     cap = cv2.VideoCapture(video_path)
+    if not cap.isOpened(): return None
     total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
     start_frame = max(0, start_frame)
     cap.set(cv2.CAP_PROP_POS_FRAMES, start_frame)
+    extracted_frames, frame_shape = {}, None
     for i in range(start_frame, end_frame):
         ret, frame = cap.read()
+        if not ret: break
+        if frame_shape is None: frame_shape = frame.shape
         frame_num_text = f"Frame: {i}"
         cv2.putText(frame, frame_num_text, (10, 30), cv2.FONT_HERSHEY_SIMPLEX, 1, (0, 0, 255), 2, cv2.LINE_AA)
+        extracted_frames[i] = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
     cap.release()
+    if not extracted_frames: return None
+    # Cria um frame preto para usar como preenchimento
+    h, w, c = frame_shape
+    black_frame = np.zeros((h, w, c), dtype=np.uint8)
+    cv2.putText(black_frame, "VAZIO", (w//2 - 50, h//2), cv2.FONT_HERSHEY_SIMPLEX, 1, (100, 100, 100), 2)
+    # Determina o início e o fim da grade, alinhados a múltiplos de 8
+    grid_start = (start_frame // 8) * 8
+    grid_end = ((end_frame - 1) // 8 + 1) * 8
+    # Preenche um dicionário com os frames reais ou de preenchimento
+    rows_dict = collections.defaultdict(list)
+    for i in range(grid_start, grid_end):
+        row_index = i // 8
+        rows_dict[row_index].append(extracted_frames.get(i, black_frame))
+    # Monta as linhas horizontalmente e depois as empilha verticalmente
+    image_rows = [np.hstack(rows_dict[row_index]) for row_index in sorted(rows_dict.keys())]
+    combined_image = np.vstack(image_rows)
+    # Salva e retorna o caminho da imagem final
     pil_img = Image.fromarray(combined_image)
+    path = "frames_extraidos_grid.png"
     pil_img.save(path)
     return path
     return plot_to_file(fig, "foco")
+# --- FUNÇÃO DE CALLBACK PRINCIPAL ---
 def run_full_analysis(video_path, descriptions_text, start_frame, end_frame, progress=gr.Progress()):
     if video_path is None: raise gr.Error("Por favor, faça o upload de um vídeo.")
     start_frame, end_frame = int(start_frame), int(end_frame)
+    progress(0, desc="Extraindo e visualizando frames...")
     frames_imagem_path = extrair_e_visualizar_frames(video_path, start_frame, end_frame)
     progress(0.1, desc="Analisando fidelidade do trecho...")
         if error_msg: gr.Warning(error_msg)
     progress(1.0, desc="Análise completa!")
     return frames_imagem_path, fidelidade_plot_path, cor_plot_path, foco_plot_path, semantico_path, anomalias_plot_path
+# --- INTERFACE GRADIO ---
 with gr.Blocks(theme=gr.themes.Soft()) as demo:
     gr.Markdown("# Suíte de Validação Completa para Geração de Vídeo (ADUC-SDR)")
     with gr.Row():
             video_input = gr.Video(label="1. Upload do vídeo")
             descriptions_input = gr.Textbox(lines=5, label="3. Descrições (Opcional)", placeholder="Uma descrição por cena para o teste de inteligência...")
             with gr.Row():
                 start_frame_input = gr.Number(label="Frame Inicial", value=0, precision=0, info="Deixe 0 e 0 para analisar o vídeo inteiro.")
                 end_frame_input = gr.Number(label="Frame Final", value=0, precision=0, info="Ex: 88 e 94 para analisar esse trecho.")
             analyze_button = gr.Button("4. Executar Análise Completa", variant="primary")
     with gr.Tabs():
         with gr.TabItem("Frames Extraídos"):
+            extracted_frames_img = gr.Image(label="Visualização dos Frames em Grade")
         with gr.TabItem("1. Fidelidade e Coerência"):
             plot_fidelidade = gr.Image(label="Gráfico de Análise de Fidelidade (SSIM e pHash)")
         with gr.TabItem("2. Cor e Iluminação"):
         with gr.TabItem("5. Inteligência Adaptativa"):
             plot_semantico = gr.Image(label="Gráfico de Estresse Semântico")
     analyze_button.click(
         fn=run_full_analysis,
         inputs=[video_input, descriptions_input, start_frame_input, end_frame_input],
+        outputs=[extracted_frames_img, plot_fidelidade, plot_cor, plot_foco, plot_semantico, anomalias_plot_path]
     )
 if __name__ == "__main__":