Spaces:

ModuMLTECH
/

projet_trafic_2

Sleeping

App Files Files Community

projet_trafic_2 / app.py

ModuMLTECH

Update app.py

b683266 verified 4 months ago

raw

history blame contribute delete

24.1 kB

	import streamlit as st
	import cv2
	import tempfile
	import os
	import time
	import numpy as np
	from ultralytics import YOLO
	import threading
	from PIL import Image
	import torch

	# --- FONCTIONS UTILES ---
	def draw_text_with_background(
	    image,
	    text,
	    position,
	    font=cv2.FONT_HERSHEY_SIMPLEX,
	    font_scale=1,
	    font_thickness=2,
	    text_color=(255, 255, 255),
	    bg_color=(0, 0, 0),
	    padding=5,
	):
	    """Draw ``text`` on an OpenCV image over a filled background rectangle.

	    The image is modified in place. The rectangle is clamped to the image
	    bounds; the text origin is ``(max(0, x) + padding, min(y, height - 1))``.

	    Args:
	        image: Array with ``shape[0]`` rows and ``shape[1]`` columns.
	        text: String to render.
	        position: ``(x, y)`` anchor of the label.
	        font: OpenCV font identifier.
	        font_scale: Scale passed to ``cv2.getTextSize`` / ``cv2.putText``.
	        font_thickness: Stroke thickness of the glyphs.
	        text_color: Colour tuple used for the text.
	        bg_color: Colour tuple used for the filled rectangle.
	        padding: Margin, in pixels, added around the text.
	    """
	    (label_w, label_h), _baseline = cv2.getTextSize(text, font, font_scale, font_thickness)
	    img_h, img_w = image.shape[0], image.shape[1]
	    anchor_x, anchor_y = position

	    # Background rectangle, clamped so it never leaves the image.
	    left = max(0, anchor_x)
	    top = max(0, anchor_y - label_h - padding)
	    right = min(img_w - 1, anchor_x + label_w + padding * 2)
	    bottom = min(img_h - 1, anchor_y + padding)
	    cv2.rectangle(image, (left, top), (right, bottom), bg_color, -1)

	    # Text is inset by the padding and kept above the last image row.
	    text_origin = (left + padding, min(anchor_y, img_h - 1))
	    cv2.putText(
	        image,
	        text,
	        text_origin,
	        font,
	        font_scale,
	        text_color,
	        font_thickness,
	        cv2.LINE_AA,
	    )


	# --- CLASSE YOLO OPTIMISÉE ---
	class YOLOVideoProcessor:
	    """Detect, track and count vehicles inside two polygonal regions.

	    Frames are optionally downscaled, passed to an Ultralytics YOLO model in
	    tracking mode, and the resulting boxes are filtered (minimum area, aspect
	    ratio, overlap) before being counted. A track ID is counted at most once
	    per region, and only once it has survived filtering on at least three
	    processed frames.
	    """

	    def __init__(self, model_path, poly1, poly2, tracker_method="bot"):
	        """Load the model and initialise the counting state.

	        Args:
	            model_path: Weights path or name handed to ``YOLO``.
	            poly1: Sequence of ``(x, y)`` points of the first region.
	            poly2: Sequence of ``(x, y)`` points of the second region.
	            tracker_method: ``"bot"`` (case-insensitive) selects
	                ``botsort.yaml``; any other value selects ``bytetrack.yaml``.
	        """
	        # Device
	        self.device = "cuda" if torch.cuda.is_available() else "cpu"

	        # Speed/accuracy knobs (callers overwrite these after construction)
	        self.frame_skip = 2            # run inference on every Nth frame
	        self.downsample_factor = 0.5   # inference-input scale; < 1.0 shrinks the frame
	        self.img_size = 640
	        self.conf_threshold = 0.35

	        # Model
	        self.model = YOLO(model_path)
	        self.model.to(self.device)

	        # Tracking
	        self.tracker_method = tracker_method
	        self.tracker_config = "botsort.yaml" if self.tracker_method.lower() == "bot" else "bytetrack.yaml"

	        # State
	        self.unique_region1_ids = set()
	        self.unique_region2_ids = set()
	        self.poly1 = poly1
	        self.poly2 = poly2
	        self.stop_processing = False
	        self.last_processed_frame = None
	        self.current_frame = 0

	        # De-duplication settings (meant for long trucks detected several times)
	        self.iou_threshold = 0.3      # boxes overlapping at or above this IoU are merged
	        self.min_box_area = 500       # boxes smaller than this area are dropped
	        self.max_aspect_ratio = 5.0   # max height/width ratio before a box is dropped

	        # Per-track history used for temporal filtering:
	        # {track_id: {'boxes': [...], 'frames': [...]}}
	        self.detection_history = {}
	        self.history_length = 5       # number of entries kept per track

	    @staticmethod
	    def is_in_region(center, poly):
	        """Return True when ``center`` lies inside or on the edge of ``poly``.

	        An empty polygon contains nothing. The point is converted to floats
	        because some OpenCV Python bindings reject other numeric types.
	        """
	        if poly is None or len(poly) == 0:
	            return False
	        poly_np = np.array(poly, dtype=np.int32)
	        point = (float(center[0]), float(center[1]))
	        return cv2.pointPolygonTest(poly_np, point, False) >= 0

	    def reset_counts(self):
	        """Forget every counted track ID and the whole detection history."""
	        self.unique_region1_ids.clear()
	        self.unique_region2_ids.clear()
	        self.detection_history.clear()

	    def _pick_fourcc(self, output_path):
	        """Return the ``mp4v`` FourCC for ``.mp4`` outputs, ``XVID`` otherwise."""
	        ext = os.path.splitext(output_path)[1].lower()
	        if ext == ".mp4":
	            return cv2.VideoWriter_fourcc(*"mp4v")
	        return cv2.VideoWriter_fourcc(*"XVID")

	    def calculate_iou(self, box1, box2):
	        """Return the Intersection-over-Union of two boxes.

	        Both boxes are ``[x_min, y_min, x_max, y_max]``. Returns 0 when the
	        union area is zero.
	        """
	        x1_min, y1_min, x1_max, y1_max = box1
	        x2_min, y2_min, x2_max, y2_max = box2

	        # Intersection (clamped to zero when the boxes do not overlap)
	        inter_w = max(0, min(x1_max, x2_max) - max(x1_min, x2_min))
	        inter_h = max(0, min(y1_max, y2_max) - max(y1_min, y2_min))
	        inter_area = inter_w * inter_h

	        # Union
	        box1_area = (x1_max - x1_min) * (y1_max - y1_min)
	        box2_area = (x2_max - x2_min) * (y2_max - y2_min)
	        union_area = box1_area + box2_area - inter_area

	        if union_area == 0:
	            return 0

	        return inter_area / union_area

	    def filter_overlapping_detections(self, boxes_coords, track_ids, confidences):
	        """Drop tiny, stretched and overlapping detections.

	        Boxes below ``min_box_area`` or with a height/width ratio above
	        ``max_aspect_ratio`` are discarded. The remainder goes through a
	        greedy non-maximum suppression: candidates are visited by decreasing
	        confidence and kept only if their IoU with every already-kept box is
	        below ``iou_threshold``.

	        Returns:
	            ``(boxes, track_ids, confidences)`` lists for the kept
	            detections, ordered by decreasing confidence.
	        """
	        if len(boxes_coords) == 0:
	            return [], [], []

	        # Candidates that pass the size / shape filters, as (confidence, index).
	        candidates = []
	        for index, (box, _tid, conf) in enumerate(zip(boxes_coords, track_ids, confidences)):
	            x_min, y_min, x_max, y_max = box
	            box_w = x_max - x_min
	            box_h = y_max - y_min
	            if box_w * box_h < self.min_box_area:
	                continue
	            if box_h / max(1, box_w) > self.max_aspect_ratio:
	                continue
	            candidates.append((conf, index))

	        # Stable sort: ties keep their original relative order.
	        candidates.sort(key=lambda item: item[0], reverse=True)

	        # A candidate is suppressed as soon as it overlaps a kept box too much.
	        keep_indices = []
	        for _conf, index in candidates:
	            box = boxes_coords[index]
	            if all(
	                self.calculate_iou(boxes_coords[kept], box) < self.iou_threshold
	                for kept in keep_indices
	            ):
	                keep_indices.append(index)

	        filtered_boxes = [boxes_coords[i] for i in keep_indices]
	        filtered_ids = [track_ids[i] for i in keep_indices]
	        filtered_confs = [confidences[i] for i in keep_indices]

	        return filtered_boxes, filtered_ids, filtered_confs

	    def update_detection_history(self, track_id, box, frame_num):
	        """Append one observation to a track, keeping the last ``history_length``."""
	        history = self.detection_history.setdefault(track_id, {'boxes': [], 'frames': []})
	        history['boxes'].append(box)
	        history['frames'].append(frame_num)

	        # Trim the oldest entries so both lists stay aligned and bounded.
	        overflow = len(history['boxes']) - self.history_length
	        if overflow > 0:
	            del history['boxes'][:overflow]
	            del history['frames'][:overflow]

	    def is_stable_detection(self, track_id):
	        """Return True once a track has at least three recorded observations."""
	        history = self.detection_history.get(track_id)
	        if history is None:
	            return False
	        return len(history['boxes']) >= 3

	    def process_video(self, video_path, output_path, progress_bar=None):
	        """Annotate a recorded video and count the vehicles in each region.

	        Inference runs on every ``frame_skip``-th frame; for the frames in
	        between, the last annotated frame is written again.

	        Args:
	            video_path: Path of the input video.
	            output_path: Path of the annotated video to write.
	            progress_bar: Optional object exposing ``progress(fraction)``.

	        Returns:
	            ``(region1_count, region2_count)``, or ``None`` when the input or
	            the output video cannot be opened.
	        """
	        cap = cv2.VideoCapture(video_path)
	        if not cap.isOpened():
	            cap.release()
	            st.error("⚠️ Erreur : Impossible d'ouvrir la vidéo.")
	            return None

	        out = None
	        frames_written = 0
	        try:
	            frame_width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
	            frame_height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
	            fps = cap.get(cv2.CAP_PROP_FPS)
	            if not fps or fps <= 1e-3:
	                fps = 30.0  # fallback when the container reports no frame rate

	            fourcc = self._pick_fourcc(output_path)
	            out = cv2.VideoWriter(output_path, fourcc, fps, (frame_width, frame_height))
	            if not out.isOpened():
	                st.error("⚠️ Erreur : Impossible d'ouvrir la vidéo de sortie (codec).")
	                return None

	            self.reset_counts()
	            total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
	            # Guard the modulo below against a zero or negative skip value.
	            frame_skip = max(1, int(self.frame_skip))

	            while True:
	                success, frame = cap.read()
	                if not success:
	                    break

	                if frames_written % frame_skip == 0:
	                    processed_frame = self.process_frame(frame, frames_written)
	                    self.last_processed_frame = processed_frame
	                else:
	                    processed_frame = self.last_processed_frame

	                if processed_frame is None:
	                    processed_frame = frame

	                # The writer needs frames of exactly the declared size.
	                if processed_frame.shape[1] != frame_width or processed_frame.shape[0] != frame_height:
	                    processed_frame = cv2.resize(
	                        processed_frame, (frame_width, frame_height), interpolation=cv2.INTER_AREA
	                    )

	                out.write(processed_frame)
	                frames_written += 1

	                # Report progress after the write so the bar can reach 100 %.
	                if progress_bar is not None and total_frames > 0:
	                    progress_bar.progress(min(1.0, frames_written / float(total_frames)))
	        finally:
	            # Always release the native handles, even if a frame raised.
	            # No cv2.destroyAllWindows(): this class never opens a window.
	            cap.release()
	            if out is not None:
	                out.release()

	        if frames_written == 0:
	            st.error("⚠️ Aucune image n'a été écrite dans la vidéo de sortie !")

	        return len(self.unique_region1_ids), len(self.unique_region2_ids)

	    def process_frame(self, frame, frame_num=0):
	        """Run detection + tracking on one frame and return an annotated copy.

	        Updates the per-track history and the per-region sets of counted IDs.
	        Returns ``None`` when ``frame`` is ``None``. Errors raised while
	        reading the tracking results are rendered onto the frame instead of
	        being propagated.
	        """
	        if frame is None:
	            return None

	        # Downscale the inference input to speed up processing.
	        frame_height, frame_width = frame.shape[:2]
	        if self.downsample_factor < 1.0:
	            resized_width = max(1, int(frame_width * self.downsample_factor))
	            resized_height = max(1, int(frame_height * self.downsample_factor))
	            resized_frame = cv2.resize(
	                frame, (resized_width, resized_height), interpolation=cv2.INTER_AREA
	            )
	        else:
	            resized_width, resized_height = frame_width, frame_height
	            resized_frame = frame

	        # Detection + tracking
	        with torch.no_grad():
	            results = self.model.track(
	                resized_frame,
	                persist=True,
	                tracker=self.tracker_config,
	                conf=self.conf_threshold,
	                imgsz=self.img_size,
	                device=self.device,
	                # COCO indices: 2=car, 5=bus, 7=truck.
	                # NOTE(review): a custom-trained model may use different class
	                # indices - confirm against the loaded weights.
	                classes=[2, 5, 7],
	                verbose=False
	            )

	        display_frame = frame.copy()

	        # Draw both regions.
	        cv2.polylines(display_frame, [np.array(self.poly1, np.int32)], isClosed=True, color=(0, 255, 0), thickness=2)
	        cv2.polylines(display_frame, [np.array(self.poly2, np.int32)], isClosed=True, color=(255, 0, 0), thickness=2)

	        # Factors mapping inference coordinates back to the original frame.
	        scale_x = frame_width / float(resized_width)
	        scale_y = frame_height / float(resized_height)

	        if results and len(results) > 0 and getattr(results[0], "boxes", None) is not None:
	            try:
	                detections = results[0].boxes
	                boxes = detections.xywh.cpu().numpy()
	                ids_tensor = detections.id
	                confs = detections.conf.cpu().numpy()

	                if ids_tensor is None:
	                    track_ids = [None] * len(boxes)
	                else:
	                    track_ids = ids_tensor.int().cpu().tolist()

	                # Convert centre/size boxes to [x_min, y_min, x_max, y_max]
	                # in original-frame pixels, clamped to the frame.
	                boxes_coords = []
	                for x, y, w, h in boxes:
	                    center_x = int(x * scale_x)
	                    center_y = int(y * scale_y)
	                    half_w = int(w * scale_x) // 2
	                    half_h = int(h * scale_y) // 2
	                    boxes_coords.append([
	                        max(0, center_x - half_w),
	                        max(0, center_y - half_h),
	                        min(frame_width - 1, center_x + half_w),
	                        min(frame_height - 1, center_y + half_h),
	                    ])

	                filtered_boxes, filtered_ids, filtered_confs = self.filter_overlapping_detections(
	                    boxes_coords, track_ids, confs
	                )

	                for box, track_id, conf in zip(filtered_boxes, filtered_ids, filtered_confs):
	                    if track_id is None:
	                        continue  # untracked boxes cannot be counted uniquely

	                    x_min, y_min, x_max, y_max = box
	                    center_point = ((x_min + x_max) // 2, (y_min + y_max) // 2)

	                    self.update_detection_history(track_id, box, frame_num)
	                    stable = self.is_stable_detection(track_id)

	                    # Only stable tracks are counted.
	                    if stable:
	                        if self.is_in_region(center_point, self.poly1):
	                            self.unique_region1_ids.add(track_id)
	                        if self.is_in_region(center_point, self.poly2):
	                            self.unique_region2_ids.add(track_id)

	                    # Box colour: green when stable, yellow otherwise.
	                    color = (0, 255, 0) if stable else (0, 255, 255)
	                    cv2.rectangle(display_frame, (x_min, y_min), (x_max, y_max), color, 2)

	                    # Track ID and confidence; keep the label inside the frame
	                    # for boxes touching the top edge.
	                    label = f"ID:{track_id} {conf:.2f}"
	                    cv2.putText(display_frame, label, (x_min, max(15, y_min - 10)),
	                                cv2.FONT_HERSHEY_SIMPLEX, 0.5, color, 2)

	            except Exception as e:
	                # Deliberate best effort: show the failure on the frame so the
	                # video/stream keeps going.
	                draw_text_with_background(display_frame, f"Tracking error: {e}", (10, 60), bg_color=(80, 0, 0))

	        # Only the region-2 total is overlaid; the region-1 set is still
	        # maintained and reported by the callers.
	        draw_text_with_background(display_frame, f"Total: {len(self.unique_region2_ids)}", (frame_width - 300, frame_height - 50))

	        return display_frame

	    def process_webcam(self, camera_id=0, display_placeholder=None, count_placeholders=None):
	        """Process a live camera stream until ``stop_processing`` becomes True.

	        Args:
	            camera_id: Index handed to ``cv2.VideoCapture``.
	            display_placeholder: Optional Streamlit placeholder receiving the
	                annotated frames.
	            count_placeholders: Optional sequence of at least two placeholders
	                receiving the region-1 and region-2 counters.
	        """
	        cap = cv2.VideoCapture(camera_id)
	        if not cap.isOpened():
	            cap.release()
	            st.error("⚠️ Erreur : Impossible d'ouvrir la webcam.")
	            return

	        try:
	            # Capture hints only: drivers are free to ignore them.
	            try:
	                cap.set(cv2.CAP_PROP_FRAME_WIDTH, 640)
	                cap.set(cv2.CAP_PROP_FRAME_HEIGHT, 480)
	                cap.set(cv2.CAP_PROP_FPS, 30)
	            except cv2.error:
	                pass

	            self.reset_counts()
	            self.stop_processing = False
	            # Guard the modulo below against a zero or negative skip value.
	            frame_skip = max(1, int(self.frame_skip))
	            frame_count = 0
	            last_ts = time.time()

	            while not self.stop_processing:
	                success, frame = cap.read()
	                if not success:
	                    st.error("⚠️ Erreur lors de la lecture du flux vidéo.")
	                    break

	                if frame_count % frame_skip == 0:
	                    processed_frame = self.process_frame(frame, frame_count)
	                    self.last_processed_frame = processed_frame
	                    # Rate measured between two consecutive inference passes.
	                    now = time.time()
	                    fps = 1.0 / max(1e-6, now - last_ts)
	                    last_ts = now
	                    if processed_frame is not None:
	                        draw_text_with_background(processed_frame, f"FPS: {fps:.1f}", (10, 30))
	                else:
	                    processed_frame = self.last_processed_frame if self.last_processed_frame is not None else frame

	                if processed_frame is not None:
	                    try:
	                        processed_frame_rgb = cv2.cvtColor(processed_frame, cv2.COLOR_BGR2RGB)
	                    except cv2.error:
	                        # Not a 3-channel BGR image: show it unchanged.
	                        processed_frame_rgb = processed_frame
	                    img = Image.fromarray(processed_frame_rgb)

	                    if display_placeholder is not None:
	                        display_placeholder.image(img, channels="RGB", use_column_width=True)

	                    if count_placeholders and len(count_placeholders) >= 2:
	                        count_placeholders[0].metric("Véhicules Sens 1 (Vert)", len(self.unique_region1_ids))
	                        count_placeholders[1].metric("Véhicules Sens 2 (Rouge)", len(self.unique_region2_ids))

	                frame_count += 1
	                time.sleep(0.01)
	        finally:
	            # Free the camera even when a frame raised, so it can be reopened.
	            cap.release()

	        st.success("✅ Flux vidéo arrêté.")


	# --- INTERFACE STREAMLIT ---
	def main():
	    """Build the Streamlit UI and wire it to ``YOLOVideoProcessor``.

	    The page has a sidebar (region polygons, tracker, tuning sliders) and two
	    tabs: one that annotates an uploaded video, one that streams a local
	    camera from a background thread.
	    """
	    # Local imports: only this function needs them.
	    import mimetypes
	    import shutil

	    st.set_page_config(
	        page_title="Détecteur de Véhicules",
	        page_icon="🚗",
	        layout="wide"
	    )

	    st.title("🚗 Détection et comptage de Véhicules sur l'Autoroute de l'Avenir")

	    # Session state (survives Streamlit reruns)
	    st.session_state.setdefault("webcam_active", False)
	    st.session_state.setdefault("processor", None)
	    st.session_state.setdefault("webcam_thread", None)
	    st.session_state.setdefault("upload_cache", None)
	    st.session_state.setdefault("camera_options", None)

	    # Model: local file first, then the Hub, then the public fallback.
	    model_path = "best.pt"
	    if not os.path.exists(model_path):
	        with st.spinner("📥 Chargement du modèle YOLO..."):
	            try:
	                from huggingface_hub import hf_hub_download
	                model_path = hf_hub_download(repo_id="ModuMLTECH/Trafic_congestion", filename="best.pt")
	                st.success("✅ Modèle chargé depuis Hugging Face Hub.")
	            except Exception as e:
	                # Top-level boundary: report the failure and fall back.
	                st.error(f"❌ Erreur lors du chargement du modèle: {e}")
	                st.warning("⚠️ Utilisation du modèle YOLO public à la place (yolov8n.pt).")
	                model_path = "yolov8n.pt"

	    # Tabs
	    tab1, tab2 = st.tabs(["📹 Analyse de Vidéo", "🎥 Détection en Temps Réel"])

	    # Sidebar
	    with st.sidebar:
	        st.header("🔹 Paramètres")

	        st.subheader("📍 Polygone 1 (vert)")
	        poly1_input = st.text_area("Entrez 4 points (x,y) séparés par des espaces", "0,0 0,0 0,0 0,0")

	        st.subheader("📍 Polygone 2 (rouge)")
	        poly2_input = st.text_area("Entrez 4 points (x,y) séparés par des espaces", "500,150 700,150 1100,530 630,530")

	        tracker_method = st.selectbox("Méthode de tracking", ["bot", "byte"], index=0)

	        st.subheader("🚀 Paramètres d'optimisation")
	        frame_skip = st.slider("Skip de frames", 1, 5, 2)
	        downsample = st.slider("Facteur d'échelle", 0.3, 1.0, 0.5, 0.1)
	        conf_threshold = st.slider("Seuil de confiance", 0.1, 0.9, 0.35, 0.05)

	        st.subheader("🔧 Anti-duplicata")
	        iou_thresh = st.slider("Seuil IoU (fusion détections)", 0.1, 0.9, 0.3, 0.05)
	        min_area = st.slider("Surface minimale (pixels²)", 100, 2000, 500, 100)

	    def parse_polygon(input_text):
	        """Parse ``"x,y x,y ..."`` (``;`` also separates points) into int pairs.

	        Returns an empty list when any token is malformed.
	        """
	        try:
	            pts = []
	            for token in input_text.replace(";", " ").split():
	                x, y = token.split(",")
	                pts.append((int(x), int(y)))
	            return pts
	        except ValueError:
	            # Wrong number of components or a non-integer coordinate.
	            return []

	    poly1 = parse_polygon(poly1_input)
	    poly2 = parse_polygon(poly2_input)
	    valid_polygons = len(poly1) == 4 and len(poly2) == 4

	    def build_processor():
	        """Create a processor configured from the current sidebar values."""
	        processor = YOLOVideoProcessor(model_path, poly1, poly2, tracker_method)
	        processor.frame_skip = frame_skip
	        processor.downsample_factor = downsample
	        processor.conf_threshold = conf_threshold
	        processor.iou_threshold = iou_thresh
	        processor.min_box_area = min_area
	        return processor

	    # Tab 1: recorded video
	    with tab1:
	        uploaded_file = st.file_uploader("📂 Upload une vidéo", type=["mp4", "avi", "mkv", "mov"])
	        if uploaded_file is not None:
	            ext = os.path.splitext(uploaded_file.name)[1].lower() or ".mp4"

	            # The script reruns on every interaction: reuse the temp copy of
	            # an unchanged upload instead of creating a new directory each time.
	            upload_key = (getattr(uploaded_file, "file_id", None), uploaded_file.name, uploaded_file.size)
	            cache = st.session_state.upload_cache
	            if cache is None or cache["key"] != upload_key or not os.path.exists(cache["input_path"]):
	                if cache is not None:
	                    shutil.rmtree(cache["dir"], ignore_errors=True)
	                temp_dir = tempfile.mkdtemp()
	                input_video_path = os.path.join(temp_dir, f"input_video{ext}")
	                with open(input_video_path, "wb") as f:
	                    f.write(uploaded_file.getbuffer())
	                cache = {"key": upload_key, "dir": temp_dir, "input_path": input_video_path}
	                st.session_state.upload_cache = cache

	            input_video_path = cache["input_path"]
	            output_video_path = os.path.join(cache["dir"], f"output_video{ext}")

	            st.video(input_video_path)

	            if st.button("▶️ Lancer la détection"):
	                if valid_polygons:
	                    progress_bar = st.progress(0)
	                    processor = build_processor()

	                    start_time = time.time()
	                    counts = processor.process_video(input_video_path, output_video_path, progress_bar=progress_bar)
	                    end_time = time.time()
	                    # ``process_video`` returns None when it could not run.
	                    if counts:
	                        count1, count2 = counts
	                        st.success(f"✅ Traitement terminé en {end_time - start_time:.2f} s")

	                        col_result1, col_result2 = st.columns(2)
	                        col_result1.metric("Véhicules Sens 1 (Vert)", count1)
	                        col_result2.metric("Véhicules Sens 2 (Rouge)", count2)

	                        st.subheader("Vidéo traitée")
	                        st.video(output_video_path)

	                        # Registered MIME type when known (e.g. video/x-msvideo
	                        # for .avi); otherwise the previous extension-based guess.
	                        mime_type = mimetypes.guess_type(f"video{ext}")[0] or f"video/{ext.strip('.')}"
	                        with open(output_video_path, "rb") as file:
	                            st.download_button(
	                                label="⬇️ Télécharger la vidéo",
	                                data=file,
	                                file_name=f"video_traitee{ext}",
	                                mime=mime_type,
	                            )
	                else:
	                    st.error("❌ Les coordonnées des polygones doivent contenir exactement 4 points.")

	    # Tab 2: webcam
	    with tab2:
	        st.header("Détection en Temps Réel avec Webcam")

	        # Probe the extra cameras once per session: opening devices on every
	        # rerun is slow and can disturb a stream that is already running.
	        camera_options = st.session_state.camera_options
	        if camera_options is None:
	            camera_options = {"Webcam par défaut": 0}
	            for i in range(1, 5):
	                try:
	                    cap = cv2.VideoCapture(i)
	                except cv2.error:
	                    continue
	                try:
	                    if cap.isOpened():
	                        camera_options[f"Caméra {i}"] = i
	                finally:
	                    cap.release()
	            st.session_state.camera_options = camera_options

	        selected_camera = st.selectbox("Sélectionnez la source vidéo", list(camera_options.keys()))
	        camera_id = camera_options[selected_camera]

	        video_placeholder = st.empty()
	        col1, col2 = st.columns(2)
	        count_placeholders = [col1.empty(), col2.empty()]

	        st.info("ℹ️ Optimisations: redimensionnement, skip de frames, filtrage anti-duplicata, CUDA si disponible.")

	        col_start, col_stop = st.columns(2)

	        # If the worker ended on its own (e.g. camera read error), clear the
	        # flag so the stream can be started again.
	        worker = st.session_state.webcam_thread
	        if st.session_state.webcam_active and (worker is None or not worker.is_alive()):
	            st.session_state.webcam_active = False

	        if col_start.button("▶️ Démarrer la détection en direct"):
	            if not valid_polygons:
	                st.error("❌ Les coordonnées des polygones doivent contenir exactement 4 points.")
	            elif st.session_state.webcam_active:
	                st.warning("⚠️ La webcam est déjà active !")
	            else:
	                st.session_state.processor = build_processor()
	                st.session_state.webcam_active = True

	                # NOTE(review): the worker calls Streamlit APIs from a thread
	                # that has no script-run context; whether the placeholders are
	                # updated depends on the Streamlit version - confirm.
	                worker = threading.Thread(
	                    target=st.session_state.processor.process_webcam,
	                    args=(camera_id, video_placeholder, count_placeholders),
	                    daemon=True,
	                )
	                st.session_state.webcam_thread = worker
	                worker.start()

	        if col_stop.button("⏹️ Arrêter la détection"):
	            if st.session_state.webcam_active and st.session_state.processor:
	                st.session_state.processor.stop_processing = True
	                st.session_state.webcam_active = False
	                # Give the loop a moment to notice the flag and free the camera.
	                worker = st.session_state.webcam_thread
	                if worker is not None:
	                    worker.join(timeout=0.5)
	                video_placeholder.empty()
	            else:
	                st.warning("⚠️ Aucune détection en cours !")


	# Script entry point: build the UI only when the file is executed directly.
	if __name__ == "__main__":
	    main()