# DetectifAI-Backend / json_reports.py
"""
JSON Reports Generation Module
This module handles:
- Processing results JSON reports
- Canonical events JSON
- Segment analysis reports
- Performance statistics
- HTML gallery generation
"""
import base64
import json
import logging
import os
import statistics
from datetime import datetime
from typing import Any, Dict, List, Optional

import cv2
logger = logging.getLogger(__name__)
class ReportGenerator:
    """Generate comprehensive JSON reports and an HTML gallery for a run.

    All artefacts are written beneath ``<config.output_base_dir>/reports``.
    ``config`` must expose the tuning attributes read by
    ``_get_config_summary`` (quality/motion/importance/similarity thresholds,
    segment settings, output options).
    """

    def __init__(self, config):
        # Pipeline configuration object; see _get_config_summary for the
        # attributes this class reads from it.
        self.config = config
        self.reports_dir = os.path.join(config.output_base_dir, "reports")
        os.makedirs(self.reports_dir, exist_ok=True)

    # ------------------------------------------------------------------ #
    # Public report generators
    # ------------------------------------------------------------------ #

    def generate_processing_results_report(self,
                                           keyframes: List,
                                           events: List,
                                           canonical_events: List,
                                           segments: List,
                                           processing_stats: Dict[str, Any]) -> str:
        """Generate the comprehensive processing-results JSON report.

        Args:
            keyframes: extracted keyframe objects (with ``frame_data``).
            events: raw detected event objects.
            canonical_events: deduplicated event objects.
            segments: temporal video segment objects.
            processing_stats: free-form performance statistics dict.

        Returns:
            Path of the written JSON file, or "" on failure.
        """
        logger.info("Generating processing results report")
        report = {
            'metadata': {
                'generation_timestamp': datetime.now().isoformat(),
                'report_version': '1.0',
                'processing_config': self._get_config_summary()
            },
            'summary': {
                'total_keyframes_extracted': len(keyframes),
                'total_events_detected': len(events),
                'canonical_events_created': len(canonical_events),
                'video_segments_created': len(segments),
                'processing_duration': processing_stats.get('total_processing_time', 0)
            },
            'keyframe_analysis': self._analyze_keyframes(keyframes),
            'event_analysis': self._analyze_events(events),
            'canonical_event_analysis': self._analyze_canonical_events(canonical_events),
            'segment_analysis': self._analyze_segments(segments),
            'performance_statistics': processing_stats,
            'quality_metrics': self._calculate_quality_metrics(keyframes, events)
        }
        return self._save_json(report, "processing_results.json",
                               "processing results report")

    def generate_canonical_events_report(self, canonical_events: List) -> str:
        """Generate the canonical (deduplicated) events JSON report.

        Returns the path of the written JSON file, or "" on failure.
        """
        logger.info("Generating canonical events report")
        report = {
            'metadata': {
                'generation_timestamp': datetime.now().isoformat(),
                'total_canonical_events': len(canonical_events),
                'deduplication_threshold': self.config.similarity_threshold
            },
            'canonical_events': [
                {
                    'canonical_id': event.canonical_id,
                    'event_type': event.event_type,
                    'representative_frame': event.representative_frame,
                    'time_range': {
                        'start_time': event.start_time,
                        'end_time': event.end_time,
                        'duration': event.duration
                    },
                    'confidence': event.confidence,
                    'frame_count': event.frame_count,
                    'aggregated_events': event.aggregated_events,
                    'description': event.description,
                    'similarity_cluster': event.similarity_cluster
                }
                for event in canonical_events
            ]
        }
        return self._save_json(report, "canonical_events.json",
                               "canonical events report")

    def generate_segments_report(self, segments: List) -> str:
        """Generate the video-segments analysis JSON report.

        Returns the path of the written JSON file, or "" on failure.
        """
        logger.info("Generating video segments report")
        report = {
            'metadata': {
                'generation_timestamp': datetime.now().isoformat(),
                'total_segments': len(segments),
                'segment_duration': self.config.segment_duration,
                'keyframes_per_segment': self.config.keyframes_per_segment
            },
            'summary_statistics': self._get_segments_summary(segments),
            'segments': [
                {
                    'segment_id': segment.segment_id,
                    'time_range': {
                        'start_timestamp': segment.start_timestamp,
                        'end_timestamp': segment.end_timestamp,
                        'duration': segment.duration
                    },
                    'frame_range': {
                        'start_frame': segment.start_frame,
                        'end_frame': segment.end_frame
                    },
                    'segment_classification': {
                        'segment_type': segment.segment_type,
                        'activity_level': segment.activity_level
                    },
                    'statistics': {
                        'motion_statistics': segment.motion_statistics,
                        'quality_statistics': segment.quality_statistics,
                        'keyframe_count': len(segment.keyframes)
                    },
                    'keyframes': segment.keyframes
                }
                for segment in segments
            ]
        }
        return self._save_json(report, "video_segments.json",
                               "video segments report")

    def generate_html_gallery(self, keyframes: List, canonical_events: List = None,
                              segments: List = None, title: str = "Video Processing Gallery") -> str:
        """Generate an interactive HTML gallery of keyframes and events.

        Returns the path of the written HTML file, or "" on failure.
        """
        logger.info("Generating HTML gallery")
        html_content = self._create_html_gallery(keyframes, canonical_events, segments, title)
        output_path = os.path.join(self.reports_dir, "canonical_gallery.html")
        try:
            with open(output_path, 'w', encoding='utf-8') as f:
                f.write(html_content)
            logger.info(f"HTML gallery saved: {output_path}")
            return output_path
        except Exception as e:
            logger.error(f"Failed to save HTML gallery: {e}")
            return ""

    def generate_captioning_report(self, captioning_results: Dict[str, Any],
                                   statistics: Dict[str, Any]) -> str:
        """Generate the video-captioning results JSON report.

        Returns the path of the written JSON file, or "" on failure.
        """
        logger.info("Generating video captioning report")
        report = {
            'metadata': {
                'generation_timestamp': datetime.now().isoformat(),
                'report_version': '1.0'
            },
            'summary': {
                'captioning_enabled': captioning_results.get('enabled', False),
                'total_captions_generated': captioning_results.get('total_captions', 0),
                'processing_time': captioning_results.get('processing_time', 0),
                'errors_count': len(captioning_results.get('errors', []))
            },
            'statistics': statistics,
            'captions': captioning_results.get('captions', []),
            'errors': captioning_results.get('errors', [])
        }
        return self._save_json(report, "video_captioning.json",
                               "video captioning report")

    # ------------------------------------------------------------------ #
    # Internal helpers
    # ------------------------------------------------------------------ #

    def _save_json(self, payload: Dict[str, Any], filename: str, label: str) -> str:
        """Serialize ``payload`` to ``<reports_dir>/<filename>``.

        ``label`` is the lowercase human name used in log messages (the
        success message capitalizes its first letter, matching the historical
        log format). Returns the output path, or "" on any write failure.
        """
        output_path = os.path.join(self.reports_dir, filename)
        try:
            with open(output_path, 'w', encoding='utf-8') as f:
                json.dump(payload, f, indent=2)
            logger.info(f"{label[0].upper()}{label[1:]} saved: {output_path}")
            return output_path
        except Exception as e:
            logger.error(f"Failed to save {label}: {e}")
            return ""

    @staticmethod
    def _count(values) -> Dict[Any, int]:
        """Tally occurrences of each value into a plain dict."""
        counts: Dict[Any, int] = {}
        for value in values:
            counts[value] = counts.get(value, 0) + 1
        return counts

    @staticmethod
    def _basic_stats(values: List[float], with_std: bool = False) -> Dict[str, float]:
        """Return min/max/mean (and optionally population std) of ``values``.

        ``values`` must be non-empty; callers guard with an emptiness check.
        ``statistics.pstdev`` is the population standard deviation, identical
        to ``numpy.std`` with its default ``ddof=0``.
        """
        stats = {
            'min': float(min(values)),
            'max': float(max(values)),
            'mean': float(sum(values) / len(values)),
        }
        if with_std:
            stats['std'] = float(statistics.pstdev(values))
        return stats

    def _get_config_summary(self) -> Dict[str, Any]:
        """Snapshot the configuration settings relevant to this run."""
        return {
            'base_quality_threshold': self.config.base_quality_threshold,
            'motion_threshold': self.config.motion_threshold,
            'event_importance_threshold': self.config.event_importance_threshold,
            'similarity_threshold': self.config.similarity_threshold,
            'segment_duration': self.config.segment_duration,
            'max_summary_frames': self.config.max_summary_frames,
            'output_resolution': self.config.output_resolution,
            'enable_clahe': self.config.enable_clahe,
            'enable_denoising': self.config.enable_denoising
        }

    def _analyze_keyframes(self, keyframes: List) -> Dict[str, Any]:
        """Summarize keyframe extraction results; {} when no keyframes."""
        if not keyframes:
            return {}
        quality_scores = [kf.frame_data.quality_score for kf in keyframes]
        motion_scores = [kf.frame_data.motion_score for kf in keyframes]
        burst_count = sum(1 for kf in keyframes if kf.frame_data.burst_active)
        enhanced_count = sum(1 for kf in keyframes if kf.frame_data.enhancement_applied)
        return {
            'total_keyframes': len(keyframes),
            'quality_statistics': self._basic_stats(quality_scores, with_std=True),
            'motion_statistics': self._basic_stats(motion_scores, with_std=True),
            'selection_reason_distribution': self._count(
                kf.selection_reason for kf in keyframes),
            'burst_frames_count': burst_count,
            'enhanced_frames_count': enhanced_count,
            'enhancement_rate': enhanced_count / len(keyframes) * 100
        }

    def _analyze_events(self, events: List) -> Dict[str, Any]:
        """Summarize detected events; {} when no events."""
        if not events:
            return {}
        confidences = [event.confidence for event in events]
        importance_scores = [event.importance_score for event in events]
        durations = [event.end_timestamp - event.start_timestamp for event in events]
        return {
            'total_events': len(events),
            'event_type_distribution': self._count(
                event.event_type for event in events),
            'confidence_statistics': self._basic_stats(confidences),
            'importance_statistics': self._basic_stats(importance_scores),
            'duration_statistics': self._basic_stats(durations)
        }

    def _analyze_canonical_events(self, canonical_events: List) -> Dict[str, Any]:
        """Summarize canonical (deduplicated) events; {} when none."""
        if not canonical_events:
            return {}
        durations = [event.duration for event in canonical_events]
        frame_counts = [event.frame_count for event in canonical_events]
        confidences = [event.confidence for event in canonical_events]
        return {
            'total_canonical_events': len(canonical_events),
            'event_type_distribution': self._count(
                event.event_type for event in canonical_events),
            'duration_statistics': self._basic_stats(durations),
            # Frame counts are reported as ints for min/max (historical format).
            'frame_count_statistics': {
                'min': int(min(frame_counts)),
                'max': int(max(frame_counts)),
                'mean': float(sum(frame_counts) / len(frame_counts))
            },
            'confidence_statistics': self._basic_stats(confidences)
        }

    def _analyze_segments(self, segments: List) -> Dict[str, Any]:
        """Summarize video segments; {} when no segments."""
        if not segments:
            return {}
        return {
            'total_segments': len(segments),
            'segment_type_distribution': self._count(
                seg.segment_type for seg in segments),
            'activity_level_distribution': self._count(
                seg.activity_level for seg in segments),
            'average_segment_duration': float(
                sum(seg.duration for seg in segments) / len(segments)),
            'total_keyframes': sum(len(seg.keyframes) for seg in segments)
        }

    def _calculate_quality_metrics(self, keyframes: List, events: List) -> Dict[str, Any]:
        """Calculate overall extraction/detection quality metrics.

        Returns {} when no keyframes were extracted (so the per-frame rates
        below never divide by zero).
        """
        if not keyframes:
            return {}
        total_frames_extracted = len(keyframes)
        burst_frames = sum(1 for kf in keyframes if kf.frame_data.burst_active)
        # "High quality" means 20% above the configured base threshold.
        high_quality_frames = sum(
            1 for kf in keyframes
            if kf.frame_data.quality_score > self.config.base_quality_threshold * 1.2)
        high_motion_frames = sum(
            1 for kf in keyframes
            if kf.frame_data.motion_score > self.config.motion_threshold)
        return {
            'frame_extraction_efficiency': {
                'total_frames_extracted': total_frames_extracted,
                'burst_frame_rate': burst_frames / total_frames_extracted * 100,
                'high_quality_frame_rate': high_quality_frames / total_frames_extracted * 100,
                'high_motion_frame_rate': high_motion_frames / total_frames_extracted * 100
            },
            'event_detection_efficiency': {
                'events_per_keyframe': len(events) / total_frames_extracted,
                'total_events_detected': len(events)
            },
            'processing_quality_score': self._calculate_overall_quality_score(keyframes, events)
        }

    def _calculate_overall_quality_score(self, keyframes: List, events: List) -> float:
        """Calculate an overall processing quality score, capped at 100.

        NOTE(review): with component scores in [0, 1] the trailing *100
        scaling makes this saturate at the 100 cap very easily — kept as-is
        to preserve historical scoring behavior.
        """
        if not keyframes:
            return 0.0
        n = len(keyframes)
        avg_quality = sum(kf.frame_data.quality_score for kf in keyframes) / n
        avg_motion = sum(kf.frame_data.motion_score for kf in keyframes) / n
        burst_rate = sum(1 for kf in keyframes if kf.frame_data.burst_active) / n
        event_rate = len(events) / n
        quality_score = (
            avg_quality * 40 +  # 40% weight on frame quality
            avg_motion * 30 +   # 30% weight on motion detection
            burst_rate * 20 +   # 20% weight on burst detection
            event_rate * 10     # 10% weight on event detection
        ) * 100
        return min(100.0, quality_score)

    def _get_segments_summary(self, segments: List) -> Dict[str, Any]:
        """Return summary distributions for segments; {} when none."""
        if not segments:
            return {}
        return {
            'total_segments': len(segments),
            'activity_level_distribution': self._count(
                seg.activity_level for seg in segments),
            'segment_type_distribution': self._count(
                seg.segment_type for seg in segments)
        }

    def _create_html_gallery(self, keyframes: List, canonical_events: List = None,
                             segments: List = None, title: str = "Video Processing Gallery") -> str:
        """Build the HTML gallery document as a string.

        Keyframe images are inlined as base64 JPEG data URIs; only the first
        50 keyframes are rendered to keep the page size manageable.
        """
        html = f"""
<!DOCTYPE html>
<html lang="en">
<head>
    <meta charset="UTF-8">
    <meta name="viewport" content="width=device-width, initial-scale=1.0">
    <title>{title}</title>
    <style>
        body {{ font-family: Arial, sans-serif; margin: 20px; background-color: #f5f5f5; }}
        .header {{ text-align: center; margin-bottom: 30px; }}
        .stats {{ display: flex; justify-content: space-around; margin-bottom: 30px; }}
        .stat-card {{ background: white; padding: 20px; border-radius: 8px; box-shadow: 0 2px 4px rgba(0,0,0,0.1); }}
        .gallery {{ display: grid; grid-template-columns: repeat(auto-fill, minmax(300px, 1fr)); gap: 20px; }}
        .frame-card {{ background: white; border-radius: 8px; overflow: hidden; box-shadow: 0 2px 4px rgba(0,0,0,0.1); }}
        .frame-image {{ width: 100%; height: 200px; object-fit: cover; }}
        .frame-info {{ padding: 15px; }}
        .frame-info h3 {{ margin: 0 0 10px 0; color: #333; }}
        .frame-info p {{ margin: 5px 0; color: #666; font-size: 14px; }}
        .event-badge {{ display: inline-block; padding: 3px 8px; border-radius: 12px; font-size: 12px; color: white; margin-right: 5px; }}
        .burst-activity {{ background-color: #e74c3c; }}
        .high-motion {{ background-color: #f39c12; }}
        .high-quality {{ background-color: #27ae60; }}
        .context-frame {{ background-color: #3498db; }}
        .timestamp {{ font-weight: bold; color: #2c3e50; }}
        .score {{ color: #8e44ad; font-weight: bold; }}
    </style>
</head>
<body>
    <div class="header">
        <h1>{title}</h1>
        <p>Generated on {datetime.now().strftime('%Y-%m-%d %H:%M:%S')}</p>
    </div>
    <div class="stats">
        <div class="stat-card">
            <h3>Keyframes</h3>
            <p>{len(keyframes)} extracted</p>
        </div>
        <div class="stat-card">
            <h3>Events</h3>
            <p>{len(canonical_events) if canonical_events else 0} canonical</p>
        </div>
        <div class="stat-card">
            <h3>Segments</h3>
            <p>{len(segments) if segments else 0} temporal</p>
        </div>
    </div>
    <div class="gallery">
"""
        # Limit to first 50 keyframes for page-size/performance reasons.
        for i, kf in enumerate(keyframes[:50]):
            try:
                frame_path = kf.frame_data.frame_path
                # Inline the image as base64 so the gallery is self-contained.
                image_data = ""
                if os.path.exists(frame_path):
                    try:
                        with open(frame_path, 'rb') as img_file:
                            image_data = base64.b64encode(img_file.read()).decode('utf-8')
                    except Exception as e:
                        logger.warning(f"Could not encode image {frame_path}: {e}")
                # Format timestamp as MM:SS.s
                timestamp = kf.frame_data.timestamp
                mins = int(timestamp // 60)
                secs = timestamp % 60
                time_str = f"{mins:02d}:{secs:04.1f}"
                # Badge priority: burst > high motion > high quality > context.
                if kf.frame_data.burst_active:
                    badge_class = "burst-activity"
                elif kf.frame_data.motion_score > self.config.motion_threshold:
                    badge_class = "high-motion"
                elif kf.frame_data.quality_score > self.config.base_quality_threshold * 1.2:
                    badge_class = "high-quality"
                else:
                    badge_class = "context-frame"
                if image_data:
                    img_html = ("<img class='frame-image' src='data:image/jpeg;base64,"
                                + image_data + "' alt='Keyframe " + str(i + 1) + "'>")
                else:
                    img_html = ("<div class='frame-image' style='background-color: #ddd; "
                                "display: flex; align-items: center; justify-content: center;"
                                "'>Image not available</div>")
                enhanced_html = "<p>✨ Enhanced</p>" if kf.frame_data.enhancement_applied else ""
                html += f"""
        <div class="frame-card">
            {img_html}
            <div class="frame-info">
                <h3>Frame {i + 1}</h3>
                <p><span class="timestamp">Time: {time_str}</span></p>
                <p>Quality: <span class="score">{kf.frame_data.quality_score:.3f}</span></p>
                <p>Motion: <span class="score">{kf.frame_data.motion_score:.4f}</span></p>
                <p>Keyframe Score: <span class="score">{kf.keyframe_score:.3f}</span></p>
                <p><span class="event-badge {badge_class}">{kf.selection_reason}</span></p>
                {enhanced_html}
            </div>
        </div>
"""
            except Exception as e:
                # Skip a broken keyframe rather than aborting the gallery.
                logger.warning(f"Error processing keyframe {i}: {e}")
        html += """
    </div>
</body>
</html>
"""
        return html
# Import numpy for statistics
import numpy as np