Spaces:

marcuscanhaco
/

weapon-detection-app

Runtime error

App Files Files Community

Marcus Vinicius Zerbini Canhaço committed on Feb 13, 2025

Commit

1ccfc24

1 Parent(s): 62fec37

feat: atualização do detector com otimizações para GPU T4

Browse files

Files changed (4) hide show

src/domain/detectors/base.py +1 -1
src/domain/detectors/gpu.py +48 -6
src/main.py +82 -69
src/presentation/web/gradio_interface.py +9 -9

src/domain/detectors/base.py CHANGED Viewed

@@ -155,7 +155,7 @@ class BaseDetector(ABC):
         """Retorna as queries otimizadas para detecção de objetos perigosos."""
         firearms = ["handgun", "rifle", "shotgun", "machine gun", "firearm"]
         edged_weapons = ["knife", "dagger", "machete", "box cutter", "sword"]
-        ranged_weapons = ["crossbow", "bow"]
         sharp_objects = ["blade", "razor", "glass shard", "screwdriver", "metallic pointed object"]
         firearm_contexts = ["close-up", "clear view", "detailed"]

         """Retorna as queries otimizadas para detecção de objetos perigosos."""
         firearms = ["handgun", "rifle", "shotgun", "machine gun", "firearm"]
         edged_weapons = ["knife", "dagger", "machete", "box cutter", "sword"]
+        ranged_weapons = ["crossbow", "bow","arrow"]
         sharp_objects = ["blade", "razor", "glass shard", "screwdriver", "metallic pointed object"]
         firearm_contexts = ["close-up", "clear view", "detailed"]

src/domain/detectors/gpu.py CHANGED Viewed

@@ -9,6 +9,7 @@ from PIL import Image
 from typing import List, Dict, Any, Tuple
 from transformers import Owlv2Processor, Owlv2ForObjectDetection
 from .base import BaseDetector
 logger = logging.getLogger(__name__)
@@ -48,6 +49,8 @@ class WeaponDetectorGPU(BaseDetector):
             # Processar queries
             self.text_queries = self._get_detection_queries()
             self.processed_text = self.owlv2_processor(
                 text=self.text_queries,
                 return_tensors="pt",
@@ -101,12 +104,17 @@ class WeaponDetectorGPU(BaseDetector):
                 labels = results["labels"]
                 for score, box, label in zip(scores, boxes, labels):
-                    if score.item() >= threshold:
                         detections.append({
-                            "confidence": score.item(),
                             "box": [int(x) for x in box.tolist()],
-                            "label": self.text_queries[label]
                         })
             # Aplicar NMS nas detecções
             detections = self._apply_nms(detections)
@@ -131,25 +139,59 @@ class WeaponDetectorGPU(BaseDetector):
         """Processa um vídeo."""
         metrics = {
             "total_time": 0,
             "frames_analyzed": 0,
             "detections": []
         }
         try:
             frames = self.extract_frames(video_path, fps or 2, resolution)
             metrics["frames_analyzed"] = len(frames)
             for i, frame in enumerate(frames):
                 frame_rgb = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
                 frame_pil = Image.fromarray(frame_rgb)
                 detections = self.detect_objects(frame_pil, threshold)
-                if detections:
                     metrics["detections"].append({
                         "frame": i,
-                        "detections": detections
                     })
-                    return video_path, metrics
             return video_path, metrics

 from typing import List, Dict, Any, Tuple
 from transformers import Owlv2Processor, Owlv2ForObjectDetection
 from .base import BaseDetector
+import time
 logger = logging.getLogger(__name__)
             # Processar queries
             self.text_queries = self._get_detection_queries()
+            logger.info(f"Queries carregadas: {self.text_queries}")  # Log das queries
             self.processed_text = self.owlv2_processor(
                 text=self.text_queries,
                 return_tensors="pt",
                 labels = results["labels"]
                 for score, box, label in zip(scores, boxes, labels):
+                    score_val = score.item()
+                    if score_val >= threshold:
+                        # Garantir que o índice está dentro dos limites
+                        label_idx = min(label.item(), len(self.text_queries) - 1)
+                        label_text = self.text_queries[label_idx]
                         detections.append({
+                            "confidence": round(score_val * 100, 2),  # Converter para porcentagem
                             "box": [int(x) for x in box.tolist()],
+                            "label": label_text
                         })
+                        logger.debug(f"Detecção: {label_text} ({score_val * 100:.2f}%)")
             # Aplicar NMS nas detecções
             detections = self._apply_nms(detections)
         """Processa um vídeo."""
         metrics = {
             "total_time": 0,
+            "frame_extraction_time": 0,
+            "analysis_time": 0,
             "frames_analyzed": 0,
+            "video_duration": 0,
+            "device_type": "GPU",
             "detections": []
         }
         try:
+            start_time = time.time()
+            # Extrair frames
+            t0 = time.time()
             frames = self.extract_frames(video_path, fps or 2, resolution)
+            metrics["frame_extraction_time"] = time.time() - t0
             metrics["frames_analyzed"] = len(frames)
+            if not frames:
+                logger.warning("Nenhum frame extraído do vídeo")
+                return video_path, metrics
+            # Calcular duração do vídeo
+            metrics["video_duration"] = len(frames) / (fps or 2)
+            # Processar frames
+            t0 = time.time()
             for i, frame in enumerate(frames):
                 frame_rgb = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
                 frame_pil = Image.fromarray(frame_rgb)
                 detections = self.detect_objects(frame_pil, threshold)
+                # Filtrar apenas detecções válidas (sem filtrar unknown)
+                valid_detections = [
+                    {
+                        "confidence": d["confidence"],
+                        "box": d["box"],
+                        "label": d["label"],
+                        "timestamp": i / (fps or 2)
+                    }
+                    for d in detections
+                    if d["confidence"] > threshold
+                ]
+                if valid_detections:
                     metrics["detections"].append({
                         "frame": i,
+                        "detections": valid_detections
                     })
+            # Atualizar métricas finais
+            metrics["analysis_time"] = time.time() - t0
+            metrics["total_time"] = time.time() - start_time
             return video_path, metrics

src/main.py CHANGED Viewed

@@ -4,6 +4,7 @@ from src.presentation.web.gradio_interface import GradioInterface
 import logging
 import torch
 import gc
 from src.domain.factories.detector_factory import force_gpu_init, is_gpu_available
 # Configurar logging
@@ -13,78 +14,83 @@ logging.basicConfig(
 )
 logger = logging.getLogger(__name__)
-def check_cuda_environment():
-    """Verifica e configura o ambiente CUDA."""
     try:
-        # Verificar variáveis de ambiente CUDA
-        cuda_path = os.getenv('CUDA_HOME') or os.getenv('CUDA_PATH')
-        if not cuda_path:
-            logger.warning("Variáveis de ambiente CUDA não encontradas")
-            return False
-        # Verificar se CUDA está disponível no PyTorch
-        if not torch.cuda.is_available():
-            logger.warning("PyTorch não detectou CUDA")
-            return False
-        # Tentar obter informações da GPU
-        try:
-            device_count = torch.cuda.device_count()
-            if device_count > 0:
-                device_name = torch.cuda.get_device_name(0)
-                logger.info(f"GPU detectada: {device_name}")
-                return True
-        except Exception as e:
-            logger.warning(f"Erro ao obter informações da GPU: {str(e)}")
-        return False
     except Exception as e:
-        logger.error(f"Erro ao verificar ambiente CUDA: {str(e)}")
-        return False
-def setup_zero_gpu():
-    """Configurações otimizadas para Zero-GPU."""
     try:
-        # Verificar ambiente CUDA primeiro
-        if not check_cuda_environment():
-            logger.warning("Ambiente CUDA não está configurado corretamente")
             return False
-        # Tentar inicializar GPU
-        if is_gpu_available():
-            # Configurar ambiente
-            os.environ['CUDA_DEVICE_ORDER'] = 'PCI_BUS_ID'
-            os.environ['CUDA_VISIBLE_DEVICES'] = '0'
-            # Limpar memória
-            torch.cuda.empty_cache()
-            gc.collect()
-            # Configurações de memória e performance
-            os.environ['PYTORCH_CUDA_ALLOC_CONF'] = 'max_split_size_mb:128'
             torch.backends.cuda.matmul.allow_tf32 = True
             torch.backends.cudnn.benchmark = True
             torch.backends.cudnn.allow_tf32 = True
-            # Configurar fração de memória
             torch.cuda.set_per_process_memory_fraction(0.9)
-            # Verificar se a configuração foi bem sucedida
-            try:
-                device = torch.device('cuda')
-                dummy = torch.zeros(1, device=device)
-                del dummy
-                logger.info(f"Configurações Zero-GPU aplicadas com sucesso na GPU: {torch.cuda.get_device_name(0)}")
-                return True
-            except Exception as e:
-                logger.error(f"Erro ao configurar GPU: {str(e)}")
-                return False
-        else:
-            logger.warning("GPU não disponível para configuração Zero-GPU. O sistema operará em modo CPU.")
             return False
     except Exception as e:
-        logger.error(f"Erro ao configurar Zero-GPU: {str(e)}")
-        logger.warning("Fallback para modo CPU devido a erro na configuração da GPU.")
         return False
 def main():
@@ -97,7 +103,15 @@ def main():
         if IS_HUGGINGFACE:
             load_dotenv('.env.huggingface')
             logger.info("Ambiente HuggingFace detectado")
-            gpu_available = setup_zero_gpu()
         else:
             load_dotenv('.env')
             logger.info("Ambiente local detectado")
@@ -108,21 +122,20 @@ def main():
         demo = interface.create_interface()
         if IS_HUGGINGFACE:
-            # Configurar com base na disponibilidade da GPU
-            if gpu_available:
-                gpu_mem = torch.cuda.get_device_properties(0).total_memory / (1024**3)
-                max_concurrent = 1  # Forçar single worker para Zero-GPU
-                logger.info(f"GPU Memory: {gpu_mem:.1f}GB, Max Concurrent: {max_concurrent}")
             else:
-                max_concurrent = 1
-                logger.warning("GPU não disponível. O sistema está operando em modo CPU. " +
-                             "Todas as funcionalidades estão disponíveis, mas o processamento será mais lento.")
             # Configurar fila
             demo = demo.queue(
                 api_open=False,
                 status_update_rate="auto",
-                max_size=5  # Reduzir tamanho da fila para economizar memória
             )
             # Launch
@@ -130,7 +143,7 @@ def main():
                 server_name="0.0.0.0",
                 server_port=7860,
                 share=False,
-                max_threads=2  # Reduzir número de threads
             )
         else:
             demo.launch(

 import logging
 import torch
 import gc
+import nvidia_smi
 from src.domain.factories.detector_factory import force_gpu_init, is_gpu_available
 # Configurar logging
 )
 logger = logging.getLogger(__name__)
def check_gpu_type():
    """Classify the GPU at index 0 in the Hugging Face environment.

    Queries NVML through the ``nvidia_smi`` bindings for the device name and
    its total memory, logs both, and maps them to a coarse label.

    Returns:
        str: ``"t4_dedicated"`` when the device name contains "T4" and it
        reports more than 14 GB, ``"zero_gpu_shared"`` when it reports less
        than 14 GB, and ``"unknown"`` in every other case, including any
        failure while talking to NVML.
    """
    try:
        nvidia_smi.nvmlInit()
        handle = nvidia_smi.nvmlDeviceGetHandleByIndex(0)
        info = nvidia_smi.nvmlDeviceGetMemoryInfo(handle)
        gpu_name = nvidia_smi.nvmlDeviceGetName(handle)
        # Older NVML bindings return the name as bytes; without decoding,
        # the substring test below raises TypeError and every GPU is
        # reported as "unknown".
        if isinstance(gpu_name, bytes):
            gpu_name = gpu_name.decode("utf-8", errors="replace")
        total_memory = info.total / (1024**3)  # bytes -> GB
        logger.info(f"GPU detectada: {gpu_name}")
        logger.info(f"Memória total: {total_memory:.2f}GB")
        # A dedicated T4 typically exposes 16 GB.
        if "T4" in gpu_name and total_memory > 14:
            return "t4_dedicated"
        # A shared Zero-GPU slice typically exposes less memory.
        if total_memory < 14:
            return "zero_gpu_shared"
        return "unknown"
    except Exception as e:
        logger.error(f"Erro ao verificar tipo de GPU: {str(e)}")
        return "unknown"
    finally:
        # Best-effort cleanup: shutdown also fails when nvmlInit() itself
        # failed, and that must not mask the result computed above.
        try:
            nvidia_smi.nvmlShutdown()
        except Exception as e:
            logger.debug("Falha ao finalizar NVML: %s", e)
def setup_gpu_environment(gpu_type: str) -> bool:
    """Configure the CUDA environment for the detected GPU type.

    Args:
        gpu_type: Label produced by the GPU detection step. The values
            ``"t4_dedicated"`` and ``"zero_gpu_shared"`` select a tuning
            profile; any other value applies only the common settings.

    Returns:
        bool: ``True`` when a tensor could be allocated on the CUDA device
        after configuration, ``False`` when CUDA is unavailable or any step
        raised.
    """
    try:
        if not torch.cuda.is_available():
            logger.warning("CUDA não está disponível")
            return False

        # Settings shared by every profile.
        os.environ['CUDA_DEVICE_ORDER'] = 'PCI_BUS_ID'
        os.environ['CUDA_VISIBLE_DEVICES'] = '0'

        # Release cached blocks and collect garbage before tuning.
        torch.cuda.empty_cache()
        gc.collect()

        if gpu_type == "t4_dedicated":
            logger.info("Configurando para T4 dedicada")
            # NOTE(review): the allocator config is presumably read when the
            # caching allocator is first used, so it is set before the
            # memory-fraction call below touches the allocator — confirm
            # against the PyTorch version in use.
            os.environ['PYTORCH_CUDA_ALLOC_CONF'] = 'max_split_size_mb:512'
            torch.backends.cuda.matmul.allow_tf32 = True
            torch.backends.cudnn.benchmark = True
            torch.backends.cudnn.allow_tf32 = True
            # A dedicated GPU can give most of its memory to this process.
            torch.cuda.set_per_process_memory_fraction(0.9)
        elif gpu_type == "zero_gpu_shared":
            logger.info("Configurando para Zero-GPU compartilhada")
            # Same ordering concern as above: environment first.
            os.environ['PYTORCH_CUDA_ALLOC_CONF'] = 'max_split_size_mb:128'
            torch.backends.cudnn.benchmark = False
            # Shared hardware: cap this process's share of device memory.
            torch.cuda.set_per_process_memory_fraction(0.6)

        # Smoke test: allocating one element proves the device is usable.
        try:
            device = torch.device('cuda')
            dummy = torch.zeros(1, device=device)
            del dummy
            logger.info(f"Configurações GPU aplicadas com sucesso para: {gpu_type}")
            return True
        except Exception as e:
            logger.error(f"Erro ao configurar GPU: {str(e)}")
            return False
    except Exception as e:
        logger.error(f"Erro ao configurar ambiente GPU: {str(e)}")
        return False
 def main():
         if IS_HUGGINGFACE:
             load_dotenv('.env.huggingface')
             logger.info("Ambiente HuggingFace detectado")
+            # Identificar e configurar GPU
+            gpu_type = check_gpu_type()
+            gpu_available = setup_gpu_environment(gpu_type)
+            if gpu_available:
+                logger.info(f"GPU configurada com sucesso: {gpu_type}")
+            else:
+                logger.warning("GPU não disponível ou não configurada corretamente")
         else:
             load_dotenv('.env')
             logger.info("Ambiente local detectado")
         demo = interface.create_interface()
         if IS_HUGGINGFACE:
+            # Configurar com base no tipo de GPU
+            if gpu_type == "t4_dedicated":
+                max_concurrent = 2  # T4 pode lidar com mais requisições
+                queue_size = 10
             else:
+                max_concurrent = 1  # Zero-GPU precisa ser mais conservadora
+                queue_size = 5
             # Configurar fila
             demo = demo.queue(
                 api_open=False,
+                max_size=queue_size,
                 status_update_rate="auto",
+                concurrency_count=max_concurrent
             )
             # Launch
                 server_name="0.0.0.0",
                 server_port=7860,
                 share=False,
+                max_threads=max_concurrent
             )
         else:
             demo.launch(

src/presentation/web/gradio_interface.py CHANGED Viewed

@@ -228,23 +228,23 @@ class GradioInterface:
                     with gr.Row():
                         with gr.Column(scale=3):
                             gr.Markdown("#### Vídeo")
-                        with gr.Column(scale=1):
-                            gr.Markdown("#### Tipo")
                         with gr.Column(scale=1):
                             gr.Markdown("#### Ação")
                     for video in sample_videos:
                         with gr.Row():
-                            with gr.Column(scale=3):
-                                gr.Video(
                                     value=video['path'],
                                     format="mp4",
                                     height=150,
-                                    interactive=False,
-                                    show_label=False
-                                )
-                            with gr.Column(scale=1):
-                                gr.Markdown(video['ground_truth'])
                             with gr.Column(scale=1, min_width=100):
                                 gr.Button(
                                     "📥 Carregar",

                     with gr.Row():
                         with gr.Column(scale=3):
                             gr.Markdown("#### Vídeo")
                         with gr.Column(scale=1):
                             gr.Markdown("#### Ação")
                     for video in sample_videos:
                         with gr.Row():
+                            with gr.Column(scale=3):
+                                gr.PlayableVideo(
                                     value=video['path'],
                                     format="mp4",
                                     height=150,
+                                    interactive=True,
+                                    show_label=True).click(
+                                    fn=self.load_sample_video,
+                                    inputs=[gr.State(video['path'])],
+                                    outputs=[input_video]
+                                    )
                             with gr.Column(scale=1, min_width=100):
                                 gr.Button(
                                     "📥 Carregar",