| """ |
| Advanced Image Enhancement using State-of-the-Art AI Models |
| Real-ESRGAN, GFPGAN, and other cutting-edge models |
| Optimized for NVIDIA RTX 3050 |
| """ |
|
|
| import cv2 |
| import numpy as np |
| import torch |
| import torch.nn as nn |
| from PIL import Image, ImageEnhance, ImageFilter |
| import os |
| import requests |
| from io import BytesIO |
| import time |
| from typing import Optional, Tuple |
| try: |
| from backend.ai_model_manager import get_ai_model_manager |
| AI_MODELS_AVAILABLE = True |
| except ImportError: |
| AI_MODELS_AVAILABLE = False |
| print("⚠️ AI models not available, using lightweight enhancer") |
| |
| from backend.lightweight_ai_enhancer import get_lightweight_enhancer |
| from backend.compact_ai_models import CompactAIEnhancer |
| from backend.ultra_compact_enhancer import get_memory_safe_enhancer |
|
|
class AdvancedImageEnhancer:
    """Advanced image enhancement using state-of-the-art AI models.

    On construction, picks between a memory-safe lightweight enhancer and
    full AI models (Real-ESRGAN / GFPGAN) based on available VRAM. When AI
    models are disabled, unavailable, or fail at runtime, every entry point
    degrades gracefully to a traditional OpenCV enhancement pipeline.
    """

    def __init__(self):
        # All AI models run on this device; prefer GPU when available.
        self.device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
        print(f"🎯 Using device: {self.device}")

        # Default to the lightweight path; this also covers CPU-only machines.
        self.use_lightweight = True
        if self.device.type == 'cuda':
            props = torch.cuda.get_device_properties(0)
            vram_gb = props.total_memory / (1024**3)
            print(f"📊 VRAM: {vram_gb:.1f} GB")

            # Full AI models need roughly 6 GB of VRAM; below that (or when
            # the AI backend failed to import) stay on the lightweight path.
            if vram_gb < 6 or not AI_MODELS_AVAILABLE:
                self.use_lightweight = True
                print("🚀 Using lightweight enhancer (optimized for <4GB VRAM)")
            else:
                self.use_lightweight = False

        if self.use_lightweight:
            print("🚀 Using memory-safe AI enhancer (<1GB VRAM)")
            self.enhancer = get_memory_safe_enhancer()
            self.ai_manager = None
            self.compact_realesrgan = None
        else:
            self.ai_manager = get_ai_model_manager()
            self.enhancer = None
            self.compact_realesrgan = None

        # Feature toggles, overridable via environment variables.
        self.use_ai_models = os.getenv('USE_AI_MODELS', '1') == '1'
        self.enhance_faces = os.getenv('ENHANCE_FACES', '1') == '1'
        # Decided per image by _detect_anime_style() inside the pipeline.
        self.use_anime_model = False

        self._load_models()

    def _load_models(self):
        """Load AI enhancement models; set self.advanced_available accordingly.

        Never raises: any loading failure flips advanced_available to False
        so callers fall back to traditional enhancement.
        """
        try:
            if self.use_lightweight:
                print("🚀 Loading lightweight AI models...")
                # Lightweight enhancer loads lazily; nothing to preload here.
                self.advanced_available = True
                print("✅ Lightweight enhancer ready")
            else:
                print("🚀 Loading advanced AI models...")

                if self.use_ai_models and self.ai_manager:
                    # General-purpose photo model.
                    self.ai_manager.load_realesrgan('RealESRGAN_x4plus')

                    # Specialized model for anime/comic-style content.
                    self.ai_manager.load_realesrgan('RealESRGAN_x4plus_anime_6B')

                    # Face restoration (GFPGAN) is optional.
                    if self.enhance_faces:
                        self.ai_manager.load_gfpgan()

                    self.advanced_available = True
                    print("✅ AI models loaded successfully")
                else:
                    print("⚠️ AI models disabled, using traditional methods")
                    self.advanced_available = False

        except Exception as e:
            print(f"⚠️ Models failed to load: {e}")
            print("⚠️ Falling back to traditional enhancement methods")
            self.advanced_available = False

    def enhance_image(self, image_path: str, output_path: Optional[str] = None) -> str:
        """Apply advanced image enhancement to a single image.

        Args:
            image_path: Path to the source image on disk.
            output_path: Destination path; defaults to overwriting the source.

        Returns:
            Path to the enhanced image, or the original path on any failure
            (this method is best-effort and never raises).
        """
        if output_path is None:
            output_path = image_path

        print(f"🚀 Enhancing image: {os.path.basename(image_path)}")

        try:
            img = cv2.imread(image_path)
            if img is None:
                print(f"❌ Failed to load image: {image_path}")
                return image_path

            enhanced_img = self._apply_enhancement_pipeline(img, image_path)

            # The JPEG quality flag is ignored by OpenCV for non-JPEG outputs.
            cv2.imwrite(output_path, enhanced_img, [cv2.IMWRITE_JPEG_QUALITY, 100])

            print(f"✅ Enhanced image saved: {os.path.basename(output_path)}")
            return output_path

        except Exception as e:
            print(f"❌ Enhancement failed: {e}")
            return image_path

    def _apply_enhancement_pipeline(self, img: np.ndarray, image_path: Optional[str] = None) -> np.ndarray:
        """Run the full enhancement pipeline on a BGR image.

        Tries the AI path first (lightweight or full, per configuration);
        on any AI failure restores the original pixels and runs the
        traditional OpenCV pipeline instead.

        Args:
            img: BGR image as returned by cv2.imread.
            image_path: Source path; required by the lightweight enhancer,
                which works on files rather than in-memory arrays.

        Returns:
            The enhanced BGR image.
        """
        original_img = img.copy()

        print("🎨 Applying AI-powered enhancement pipeline...")

        # Choose the specialized anime model when the content looks drawn.
        self.use_anime_model = self._detect_anime_style(img)

        if self.advanced_available and self.use_ai_models:
            try:
                if self.use_lightweight:
                    print("   🚀 Applying memory-safe AI enhancement...")

                    # The lightweight enhancer is file-based, so we need a
                    # real path to round-trip through.
                    if image_path is None:
                        raise ValueError("image_path is required for lightweight enhancement")

                    # Split only the extension — naive str.replace('.', ...)
                    # would corrupt paths with dots in directory names.
                    root, ext = os.path.splitext(image_path)
                    temp_path = f"{root}_temp{ext}"
                    cv2.imwrite(temp_path, img)

                    enhanced_path = self.enhancer.enhance_image(
                        temp_path,
                        f"{root}_enhanced{ext}"
                    )

                    result = cv2.imread(enhanced_path)

                    # Clean up intermediate files before checking the result.
                    if os.path.exists(temp_path):
                        os.remove(temp_path)
                    if os.path.exists(enhanced_path) and enhanced_path != image_path:
                        os.remove(enhanced_path)

                    if result is None:
                        raise RuntimeError(f"Could not read enhanced output: {enhanced_path}")
                    img = result

                    print("   ✅ Memory-safe enhancement complete")

                    if hasattr(self.enhancer, 'get_memory_usage'):
                        print(f"   💾 Memory: {self.enhancer.get_memory_usage()}")
                else:
                    # Full pipeline: super resolution, then optional face
                    # restoration, then post-processing.
                    print("   🚀 Applying AI super resolution...")
                    img = self.ai_manager.enhance_image_realesrgan(
                        img,
                        use_anime_model=self.use_anime_model
                    )

                    if self.enhance_faces:
                        print("   👤 Enhancing faces with AI...")
                        img = self.ai_manager.enhance_face_gfpgan(img)

                    img = self.ai_manager.post_process(img)

                    # Release VRAM between images.
                    self.ai_manager.clear_memory()

                return img

            except Exception as e:
                # Restore untouched pixels and fall through to the
                # traditional pipeline below.
                print(f"⚠️ AI enhancement failed: {e}, using fallback")
                img = original_img

        print("   📈 Using traditional enhancement methods...")

        img = self._apply_super_resolution_advanced(img)
        img = self._enhance_colors_advanced(img)
        img = self._reduce_noise_advanced(img)
        img = self._enhance_sharpness_advanced(img)
        img = self._optimize_dynamic_range_advanced(img)
        img = self._enhance_faces_advanced(img)

        return img

    def _apply_super_resolution_advanced(self, img: np.ndarray) -> np.ndarray:
        """Upscale with Lanczos resampling (capped at 2x and 2048x1080)."""
        try:
            print("📈 Applying advanced super resolution (up to 2x upscaling)...")

            height, width = img.shape[:2]

            # Cap at 2x; also shrink images that already exceed 2048x1080.
            scale_factor = min(2048 / width, 1080 / height, 2.0)
            target_width = int(width * scale_factor)
            target_height = int(height * scale_factor)

            # Lanczos gives the best quality for photographic resizing.
            img = cv2.resize(img, (target_width, target_height),
                             interpolation=cv2.INTER_LANCZOS4)

            # Mild sharpening to recover detail lost in resampling.
            kernel = np.array([[-1, -1, -1], [-1, 9, -1], [-1, -1, -1]])
            img = cv2.filter2D(img, -1, kernel)

            print(f"✅ Super resolution completed: {width}x{height} → {target_width}x{target_height}")

        except Exception as e:
            print(f"⚠️ Super resolution failed: {e}")

        return img

    def _enhance_colors_advanced(self, img: np.ndarray) -> np.ndarray:
        """Boost contrast and saturation via LAB CLAHE and HSV scaling."""
        try:
            print("🎨 Applying advanced color enhancement...")

            lab = cv2.cvtColor(img, cv2.COLOR_BGR2LAB)

            # CLAHE on the lightness channel: local contrast without
            # blowing out global exposure.
            clahe = cv2.createCLAHE(clipLimit=3.0, tileGridSize=(8, 8))
            lab[:, :, 0] = clahe.apply(lab[:, :, 0])

            # Push the a/b chroma channels for more vivid color.
            lab[:, :, 1] = cv2.convertScaleAbs(lab[:, :, 1], alpha=1.3, beta=10)
            lab[:, :, 2] = cv2.convertScaleAbs(lab[:, :, 2], alpha=1.3, beta=10)

            enhanced = cv2.cvtColor(lab, cv2.COLOR_LAB2BGR)

            # Final saturation lift in HSV space.
            hsv = cv2.cvtColor(enhanced, cv2.COLOR_BGR2HSV)
            hsv[:, :, 1] = cv2.convertScaleAbs(hsv[:, :, 1], alpha=1.4, beta=0)
            enhanced = cv2.cvtColor(hsv, cv2.COLOR_HSV2BGR)

        except Exception as e:
            print(f"⚠️ Color enhancement failed: {e}")
            enhanced = img

        return enhanced

    def _reduce_noise_advanced(self, img: np.ndarray) -> np.ndarray:
        """Multi-stage denoising that tries to preserve edges."""
        try:
            print("🧹 Applying advanced noise reduction...")

            # Bilateral filter: smooths flat regions, keeps edges.
            denoised = cv2.bilateralFilter(img, 9, 75, 75)

            # Non-local means: strong color-noise removal.
            denoised = cv2.fastNlMeansDenoisingColored(denoised, None, 10, 10, 7, 21)

            # Light blur to suppress residual speckle.
            denoised = cv2.GaussianBlur(denoised, (3, 3), 0)

            # Edge-preserving pass to restore structure after the blur.
            denoised = cv2.edgePreservingFilter(denoised, flags=1, sigma_s=60, sigma_r=0.4)

        except Exception as e:
            print(f"⚠️ Noise reduction failed: {e}")
            denoised = img

        return denoised

    def _enhance_sharpness_advanced(self, img: np.ndarray) -> np.ndarray:
        """Sharpen via unsharp masking, kernel filter, and edge blending."""
        try:
            print("🔪 Applying advanced sharpness enhancement...")

            # Unsharp mask: original minus a blurred copy.
            gaussian = cv2.GaussianBlur(img, (0, 0), 2.0)
            sharpened = cv2.addWeighted(img, 1.5, gaussian, -0.5, 0)

            # Additional high-pass kernel sharpening.
            kernel = np.array([[-1, -1, -1], [-1, 9, -1], [-1, -1, -1]])
            sharpened = cv2.filter2D(sharpened, -1, kernel)

            # Blend in Laplacian edges for extra crispness. Clip before the
            # uint8 cast — a bare cast would wrap values above 255.
            gray = cv2.cvtColor(sharpened, cv2.COLOR_BGR2GRAY)
            laplacian = cv2.Laplacian(gray, cv2.CV_64F)
            laplacian = np.uint8(np.clip(np.absolute(laplacian), 0, 255))
            sharpened = cv2.addWeighted(sharpened, 1.0, cv2.cvtColor(laplacian, cv2.COLOR_GRAY2BGR), 0.3, 0)

        except Exception as e:
            print(f"⚠️ Sharpness enhancement failed: {e}")
            sharpened = img

        return sharpened

    def _optimize_dynamic_range_advanced(self, img: np.ndarray) -> np.ndarray:
        """Even out dynamic range with mild CLAHE and brightness scaling."""
        try:
            print("📊 Applying advanced dynamic range optimization...")

            lab = cv2.cvtColor(img, cv2.COLOR_BGR2LAB)

            # Gentler CLAHE than the color pass (clipLimit 2.0 vs 3.0).
            clahe = cv2.createCLAHE(clipLimit=2.0, tileGridSize=(8, 8))
            lab[:, :, 0] = clahe.apply(lab[:, :, 0])

            # Small chroma lift.
            lab[:, :, 1] = cv2.convertScaleAbs(lab[:, :, 1], alpha=1.2, beta=0)
            lab[:, :, 2] = cv2.convertScaleAbs(lab[:, :, 2], alpha=1.2, beta=0)

            optimized = cv2.cvtColor(lab, cv2.COLOR_LAB2BGR)

            # Final global brightness/contrast tweak.
            optimized = cv2.convertScaleAbs(optimized, alpha=1.1, beta=5)

        except Exception as e:
            print(f"⚠️ Dynamic range optimization failed: {e}")
            optimized = img

        return optimized

    def _enhance_faces_advanced(self, img: np.ndarray) -> np.ndarray:
        """Detect faces with a Haar cascade and enhance each region in place."""
        try:
            print("👤 Applying advanced face enhancement...")

            face_cascade = cv2.CascadeClassifier(cv2.data.haarcascades + 'haarcascade_frontalface_default.xml')

            gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
            faces = face_cascade.detectMultiScale(gray, 1.1, 4)

            if len(faces) > 0:
                print(f"🎭 Found {len(faces)} faces, applying enhancement...")

                for (x, y, w, h) in faces:
                    face_roi = img[y:y+h, x:x+w]
                    enhanced_face = self._enhance_face_region(face_roi)
                    # Paste the enhanced region back (mutates img).
                    img[y:y+h, x:x+w] = enhanced_face
            else:
                print("👤 No faces detected, skipping face enhancement")

        except Exception as e:
            print(f"⚠️ Face enhancement failed: {e}")

        return img

    def _enhance_face_region(self, face_img: np.ndarray) -> np.ndarray:
        """Smooth, saturate, and lightly sharpen a cropped face region."""
        try:
            # Skin smoothing without destroying edges.
            enhanced = cv2.bilateralFilter(face_img, 5, 50, 50)

            # Subtle saturation boost for healthier skin tones.
            hsv = cv2.cvtColor(enhanced, cv2.COLOR_BGR2HSV)
            hsv[:, :, 1] = cv2.convertScaleAbs(hsv[:, :, 1], alpha=1.1, beta=0)
            enhanced = cv2.cvtColor(hsv, cv2.COLOR_HSV2BGR)

            # Gentle sharpening (weaker kernel than the global pass).
            kernel = np.array([[-0.5, -0.5, -0.5], [-0.5, 5, -0.5], [-0.5, -0.5, -0.5]])
            enhanced = cv2.filter2D(enhanced, -1, kernel)

        except Exception:
            enhanced = face_img

        return enhanced

    def _detect_anime_style(self, img: np.ndarray) -> bool:
        """Heuristically detect anime/manga/comic-style images.

        Uses three signals — low edge density, a limited color palette,
        and low gradient variance — all of which must hold. Returns False
        on any error. NOTE(review): thresholds appear hand-tuned; the
        unique-color count scans every pixel, which can be slow on very
        large images.
        """
        try:
            gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)

            # Fraction of pixels lying on Canny edges.
            edges = cv2.Canny(gray, 50, 150)
            edge_density = np.sum(edges > 0) / edges.size

            # Distinct BGR triples; drawn art tends to use flat fills.
            unique_colors = len(np.unique(img.reshape(-1, img.shape[2]), axis=0))

            # Gradient variance; photos have richer texture.
            laplacian = cv2.Laplacian(gray, cv2.CV_64F)
            gradient_variance = np.var(laplacian)

            is_anime = (
                edge_density < 0.15 and
                unique_colors < 10000 and
                gradient_variance < 1000
            )

            if is_anime:
                print("   🎌 Detected anime/comic style - using specialized model")

            return is_anime

        except Exception as e:
            print(f"⚠️ Style detection failed: {e}")
            return False

    def enhance_batch(self, image_paths: list, output_dir: str = None) -> list:
        """Enhance multiple images, writing results into output_dir.

        Args:
            image_paths: Paths of the images to enhance.
            output_dir: Destination directory (created if missing);
                defaults to "enhanced".

        Returns:
            List of result paths, one per input (the original path is kept
            for images whose enhancement failed).
        """
        if output_dir is None:
            output_dir = "enhanced"

        os.makedirs(output_dir, exist_ok=True)
        enhanced_paths = []

        print(f"🎯 Enhancing {len(image_paths)} images with advanced techniques...")

        for i, image_path in enumerate(image_paths, 1):
            print(f"📸 Processing {i}/{len(image_paths)}: {os.path.basename(image_path)}")

            # Each result is written as "enhanced_<original filename>".
            filename = os.path.basename(image_path)
            output_path = os.path.join(output_dir, f"enhanced_{filename}")

            enhanced_path = self.enhance_image(image_path, output_path)
            enhanced_paths.append(enhanced_path)

        print(f"✅ Enhanced {len(enhanced_paths)} images with advanced techniques")
        return enhanced_paths
|
|
| |
| advanced_enhancer = None |
|
|
| def get_advanced_enhancer(): |
| """Get or create global advanced enhancer instance""" |
| global advanced_enhancer |
| if advanced_enhancer is None: |
| advanced_enhancer = AdvancedImageEnhancer() |
| return advanced_enhancer |
|
|
# Manual smoke test: constructing the enhancer triggers device selection
# and model loading when this module is run as a script.
if __name__ == "__main__":
    
    enhancer = AdvancedImageEnhancer()
    print("🧪 Advanced Image Enhancer ready for testing!")