AR_fetchtry / app.py
FaizanShaikh1's picture
Update app.py
479b418 verified
import cv2
import numpy as np
import argparse
import time
import sys
import os
from pathlib import Path
from PIL import Image
import tempfile
import io
import threading
from shiny import App, render, ui, reactive
from shiny.types import ImgData
import base64
# Constants
MODEL_DIR = "models"
TEMP_DIR = "temp"
# Don't import tkinter at the top level
# This allows the app to run in environments without Tkinter (like Hugging Face)
def parse_args():
parser = argparse.ArgumentParser(description='Advanced Virtual Try-On')
parser.add_argument('--garment', type=str, help='Path to garment image')
parser.add_argument('--webcam', type=int, default=0, help='Webcam index to use')
parser.add_argument('--resolution', type=str, default='640x480', help='Camera resolution')
parser.add_argument('--shiny', action='store_true', help='Run in Shiny mode')
parser.add_argument('--tkinter', action='store_true', help='Run with Tkinter UI')
return parser.parse_args()
class HumanPoseEstimator:
"""Human pose estimation using OpenPose or similar model"""
def __init__(self):
# Create model directory if it doesn't exist
if not os.path.exists(MODEL_DIR):
os.makedirs(MODEL_DIR)
# Download pose model if not present (simplified here)
self.download_models_if_needed()
# Load COCO body model for OpenPose
self.BODY_PARTS = {
"Nose": 0, "Neck": 1, "RShoulder": 2, "RElbow": 3, "RWrist": 4,
"LShoulder": 5, "LElbow": 6, "LWrist": 7, "RHip": 8, "RKnee": 9,
"RAnkle": 10, "LHip": 11, "LKnee": 12, "LAnkle": 13, "REye": 14,
"LEye": 15, "REar": 16, "LEar": 17, "Background": 18
}
self.POSE_PAIRS = [
["Neck", "RShoulder"], ["Neck", "LShoulder"], ["RShoulder", "RElbow"],
["RElbow", "RWrist"], ["LShoulder", "LElbow"], ["LElbow", "LWrist"],
["Neck", "RHip"], ["RHip", "RKnee"], ["RKnee", "RAnkle"], ["Neck", "LHip"],
["LHip", "LKnee"], ["LKnee", "LAnkle"], ["Neck", "Nose"], ["Nose", "REye"],
["REye", "REar"], ["Nose", "LEye"], ["LEye", "LEar"]
]
# Load OpenPose network
self.net = self.load_pose_model()
print("Pose estimation model loaded successfully")
def download_models_if_needed(self):
"""Download models if not present"""
# Model paths
pose_model_path = os.path.join(MODEL_DIR, "pose_iter_440000.caffemodel")
pose_proto_path = os.path.join(MODEL_DIR, "pose_deploy_linevec.prototxt")
# Check if models exist
if not os.path.exists(pose_model_path) or not os.path.exists(pose_proto_path):
print("Models not found. Downloading pose estimation models...")
# Normally we'd download the models here using requests or urllib
# For this example, we'll direct the user to download them manually
print("Please download the OpenPose model:")
print(f"1. Download pose_iter_440000.caffemodel to {MODEL_DIR}")
print(f"2. Download pose_deploy_linevec.prototxt to {MODEL_DIR}")
print("Models can be found at: https://github.com/CMU-Perceptual-Computing-Lab/openpose/tree/master/models")
# Create directory for models
Path(MODEL_DIR).mkdir(parents=True, exist_ok=True)
# For demonstration, we'll create dummy files with instructions
with open(pose_proto_path, 'w') as f:
f.write("# Download the actual model file from OpenPose repository")
with open(pose_model_path, 'w') as f:
f.write("# Download the actual model file from OpenPose repository")
print("Created placeholder files. Replace with actual model files before running.")
def load_pose_model(self):
"""Load the pose detection model"""
try:
# Try to load the OpenPose model
model_path = os.path.join(MODEL_DIR, "pose_iter_440000.caffemodel")
config_path = os.path.join(MODEL_DIR, "pose_deploy_linevec.prototxt")
if os.path.getsize(model_path) < 1000: # Placeholder file
print("Warning: Using placeholder model file. Results will be simulated.")
# Fall back to a basic pose estimation
return None
net = cv2.dnn.readNetFromCaffe(config_path, model_path)
# Try to use GPU if available - safely check for CUDA availability
try:
# Check if CUDA is available by testing if the cv2.cuda module exists
cuda_available = False
if hasattr(cv2, 'cuda'):
try:
cuda_available = cv2.cuda.getCudaEnabledDeviceCount() > 0
except:
cuda_available = False
if cuda_available:
print("CUDA is available. Using GPU acceleration.")
net.setPreferableBackend(cv2.dnn.DNN_BACKEND_CUDA)
net.setPreferableTarget(cv2.dnn.DNN_TARGET_CUDA)
else:
print("CUDA is not available. Using CPU.")
net.setPreferableBackend(cv2.dnn.DNN_BACKEND_DEFAULT)
net.setPreferableTarget(cv2.dnn.DNN_TARGET_CPU)
except Exception as cuda_err:
print(f"Error checking CUDA availability: {cuda_err}. Using CPU instead.")
net.setPreferableBackend(cv2.dnn.DNN_BACKEND_DEFAULT)
net.setPreferableTarget(cv2.dnn.DNN_TARGET_CPU)
return net
except Exception as e:
print(f"Error loading pose model: {e}")
print("Falling back to simulation mode")
return None
def estimate_pose(self, frame):
"""Estimate human pose in the frame"""
frame_height, frame_width = frame.shape[:2]
# If we don't have the actual model, simulate pose detection
if self.net is None:
return self.simulate_pose(frame)
# Prepare input for the network
input_blob = cv2.dnn.blobFromImage(frame, 1.0 / 255, (368, 368), (0, 0, 0), swapRB=False, crop=False)
self.net.setInput(input_blob)
# Forward pass through the network
output = self.net.forward()
# Parse keypoints
keypoints = []
threshold = 0.1
for i in range(len(self.BODY_PARTS) - 1): # Exclude background
# Get confidence map
prob_map = output[0, i, :, :]
prob_map = cv2.resize(prob_map, (frame_width, frame_height))
# Find global maximum
_, confidence, _, point = cv2.minMaxLoc(prob_map)
if confidence > threshold:
keypoints.append((point[0], point[1], confidence))
else:
keypoints.append(None)
return keypoints
def simulate_pose(self, frame):
"""Simulate pose detection when model isn't available"""
# Use face detection to estimate body position
face_cascade = cv2.CascadeClassifier(cv2.data.haarcascades + 'haarcascade_frontalface_default.xml')
gray = cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY)
faces = face_cascade.detectMultiScale(gray, 1.3, 5)
# Initialize keypoints
keypoints = [None] * (len(self.BODY_PARTS) - 1)
if len(faces) > 0:
# Get the largest face
x, y, w, h = max(faces, key=lambda rect: rect[2] * rect[3])
# Center of face
face_center_x = x + w // 2
face_center_y = y + h // 2
# Estimate keypoints based on face position
frame_height, frame_width = frame.shape[:2]
# Nose (center of face)
keypoints[self.BODY_PARTS["Nose"]] = (face_center_x, face_center_y, 0.9)
# Neck (below face)
neck_y = y + h + h // 4
keypoints[self.BODY_PARTS["Neck"]] = (face_center_x, neck_y, 0.8)
# Shoulders (on either side of neck)
shoulder_y = neck_y + h // 8
keypoints[self.BODY_PARTS["RShoulder"]] = (face_center_x - w, shoulder_y, 0.7)
keypoints[self.BODY_PARTS["LShoulder"]] = (face_center_x + w, shoulder_y, 0.7)
# Approximate other body parts
keypoints[self.BODY_PARTS["RHip"]] = (face_center_x - w//2, frame_height - h*2, 0.5)
keypoints[self.BODY_PARTS["LHip"]] = (face_center_x + w//2, frame_height - h*2, 0.5)
return keypoints
def draw_skeleton(self, frame, keypoints):
"""Draw skeleton on the frame for visualization"""
# Draw keypoints
for i, keypoint in enumerate(keypoints):
if keypoint:
cv2.circle(frame, (int(keypoint[0]), int(keypoint[1])), 8, (0, 255, 255), thickness=-1, lineType=cv2.FILLED)
# Draw connections
for pair in self.POSE_PAIRS:
part_from = self.BODY_PARTS[pair[0]]
part_to = self.BODY_PARTS[pair[1]]
if keypoints[part_from] and keypoints[part_to]:
cv2.line(frame,
(int(keypoints[part_from][0]), int(keypoints[part_from][1])),
(int(keypoints[part_to][0]), int(keypoints[part_to][1])),
(0, 255, 0), 3)
return frame
class GarmentProcessor:
"""Process garment images for virtual try-on"""
def __init__(self):
# Create temp directory for processed images
if not os.path.exists(TEMP_DIR):
os.makedirs(TEMP_DIR)
def load_garment(self, path):
"""Load and preprocess a garment image"""
# Load the image
garment = cv2.imread(path, cv2.IMREAD_UNCHANGED)
if garment is None:
raise FileNotFoundError(f"Could not load garment image from {path}")
# If garment doesn't have alpha channel, add one
if garment.shape[2] == 3:
garment = self.remove_background(garment)
return garment
def remove_background(self, img):
"""Remove background from garment image including black backgrounds"""
# Convert to RGBA
rgba = cv2.cvtColor(img, cv2.COLOR_BGR2BGRA)
# Get image dimensions
h, w = img.shape[:2]
# Create an initial mask
# Instead of simple thresholding which fails for black clothes,
# we'll use a combination of techniques
# 1. Start with an approximate mask using color detection
# Convert to different color spaces
hsv = cv2.cvtColor(img, cv2.COLOR_BGR2HSV)
gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
# Create masks for different color spaces
# Detect very dark regions (potential black backgrounds)
_, dark_mask = cv2.threshold(gray, 30, 255, cv2.THRESH_BINARY)
# Detect edges - useful for finding garment boundaries
edges = cv2.Canny(img, 50, 150)
kernel = np.ones((5,5), np.uint8)
dilated_edges = cv2.dilate(edges, kernel, iterations=2)
# Create initial GrabCut mask
# 0 = background, 1 = foreground, 2 = probable background, 3 = probable foreground
gc_mask = np.zeros(img.shape[:2], np.uint8)
# Mark the borders as likely background
border_width = w // 10 # 10% of width
gc_mask[:border_width, :] = 2
gc_mask[-border_width:, :] = 2
gc_mask[:, :border_width] = 2
gc_mask[:, -border_width:] = 2
# Mark the center as likely foreground
center_rect = (border_width, border_width, w - 2*border_width, h - 2*border_width)
cv2.rectangle(gc_mask, (center_rect[0], center_rect[1]),
(center_rect[0] + center_rect[2], center_rect[1] + center_rect[3]), 3, -1)
# Use edges to refine foreground
gc_mask[dilated_edges > 0] = 1
# Initialize GrabCut background and foreground models
bgd_model = np.zeros((1, 65), np.float64)
fgd_model = np.zeros((1, 65), np.float64)
# Run GrabCut algorithm
try:
cv2.grabCut(img, gc_mask, center_rect, bgd_model, fgd_model, 5, cv2.GC_INIT_WITH_MASK)
except Exception as e:
print(f"GrabCut failed: {e}. Using fallback method.")
# Fallback to simpler method if GrabCut fails
# Create a simple mask based on color threshold
_, mask = cv2.threshold(gray, 200, 255, cv2.THRESH_BINARY_INV)
kernel = np.ones((5, 5), np.uint8)
mask = cv2.morphologyEx(mask, cv2.MORPH_OPEN, kernel)
mask = cv2.morphologyEx(mask, cv2.MORPH_CLOSE, kernel)
rgba[:, :, 3] = mask
return rgba
# Create final mask where 1 and 3 are foreground
final_mask = np.where((gc_mask == 1) | (gc_mask == 3), 255, 0).astype('uint8')
# Clean up mask with morphological operations
kernel = np.ones((5, 5), np.uint8)
final_mask = cv2.morphologyEx(final_mask, cv2.MORPH_OPEN, kernel)
final_mask = cv2.morphologyEx(final_mask, cv2.MORPH_CLOSE, kernel)
# Dilate the mask slightly to include edge details
final_mask = cv2.dilate(final_mask, kernel, iterations=1)
# Apply mask to alpha channel
rgba[:, :, 3] = final_mask
print("Added transparency to garment image with advanced background removal")
return rgba
def warp_garment(self, garment, keypoints, frame_size, sizing_params=None):
"""Warp the garment to fit the detected pose"""
frame_height, frame_width = frame_size
# Set default sizing parameters if not provided
if sizing_params is None:
sizing_params = {
'width_scale': 1.2, # Default width scale - reduced for better fit
'height_scale': 1.1 # Default height scale
}
# If no valid keypoints, return original garment
if not keypoints or not keypoints[1]: # Check if neck keypoint exists
return garment
# Get relevant keypoints for garment warping
neck = keypoints[1]
right_shoulder = keypoints[2]
left_shoulder = keypoints[5]
right_hip = keypoints[8]
left_hip = keypoints[11]
if not all([neck, right_shoulder, left_shoulder]):
return garment # Not enough keypoints
# Calculate garment dimensions based on body
if right_shoulder and left_shoulder:
# Calculate Euclidean distance between shoulders
shoulder_width = np.linalg.norm(
[left_shoulder[0] - right_shoulder[0], left_shoulder[1] - right_shoulder[1]]
)
# Get angle between shoulders for rotation
shoulder_angle = np.arctan2(
left_shoulder[1] - right_shoulder[1],
left_shoulder[0] - right_shoulder[0]
) * 180 / np.pi
else:
shoulder_width = frame_width * 0.2 # Fallback
shoulder_angle = 0
# Calculate torso measurements for better proportions
torso_height = 0
if right_hip and left_hip and neck:
# Distance from neck to hips
hip_center_x = (left_hip[0] + right_hip[0]) / 2
hip_center_y = (left_hip[1] + right_hip[1]) / 2
torso_height = np.linalg.norm([hip_center_x - neck[0], hip_center_y - neck[1]])
else:
# Estimate torso height based on shoulder width and typical human proportions
# Use a more conservative estimate for better fit
torso_height = shoulder_width * 1.4 # Adjusted from 1.6 for better fit
# Calculate body size estimate
body_width = shoulder_width * 1.1 # Slightly wider than shoulders (reduced from 1.2)
# Get garment original dimensions
garment_height, garment_width = garment.shape[:2]
# Calculate aspect ratio of the garment
garment_aspect = garment_width / float(garment_height) if garment_height > 0 else 1.0
# Calculate ideal dimensions for the garment based on body
# For t-shirts: width should cover shoulders plus some extra, height should cover torso
ideal_width = shoulder_width * sizing_params['width_scale']
ideal_height = torso_height * sizing_params['height_scale']
# Maintain aspect ratio while fitting to body
if (ideal_width / ideal_height) > garment_aspect:
# Width-constrained: use ideal width, calculate height to maintain aspect
target_width = int(ideal_width)
target_height = int(target_width / garment_aspect)
else:
# Height-constrained: use ideal height, calculate width to maintain aspect
target_height = int(ideal_height)
target_width = int(target_height * garment_aspect)
# Resize garment to target dimensions
garment_resized = self.resize_garment(garment, target_width, target_height)
# Apply rotation if shoulders aren't level (beyond a small threshold)
if abs(shoulder_angle) > 5:
center = (garment_resized.shape[1] // 2, garment_resized.shape[0] // 2)
rotation_matrix = cv2.getRotationMatrix2D(center, shoulder_angle, 1.0)
garment_resized = cv2.warpAffine(
garment_resized, rotation_matrix,
(garment_resized.shape[1], garment_resized.shape[0]),
flags=cv2.INTER_LINEAR, borderMode=cv2.BORDER_TRANSPARENT
)
# Apply perspective transform to better fit the body shape
try:
# Only apply perspective transform if we have all four corners (shoulders and hips)
if all([right_shoulder, left_shoulder, right_hip, left_hip]):
# Define source points (corners of the garment)
garment_h, garment_w = garment_resized.shape[:2]
src_pts = np.array([
[0, 0], # Top-left
[garment_w, 0], # Top-right
[garment_w, garment_h], # Bottom-right
[0, garment_h] # Bottom-left
], dtype=np.float32)
# Define destination points based on body keypoints
# Scale factors to find garment edges from body keypoints
top_width_factor = 1.1 # How much wider than shoulders at top
bottom_width_factor = 0.9 # How much wider than hips at bottom
# Calculate destination points
top_left_x = left_shoulder[0] - (shoulder_width * (top_width_factor - 1) / 2)
top_right_x = right_shoulder[0] + (shoulder_width * (top_width_factor - 1) / 2)
bottom_left_x = left_hip[0] - (shoulder_width * (bottom_width_factor - 1) / 2)
bottom_right_x = right_hip[0] + (shoulder_width * (bottom_width_factor - 1) / 2)
# Get y-coordinates (adjust top to be at collar position)
top_y = (left_shoulder[1] + right_shoulder[1]) / 2 - garment_h * 0.2
bottom_y = top_y + garment_h * 0.95 # Slightly higher than full height for better look
dst_pts = np.array([
[top_left_x, top_y], # Top-left
[top_right_x, top_y], # Top-right
[bottom_right_x, bottom_y], # Bottom-right
[bottom_left_x, bottom_y] # Bottom-left
], dtype=np.float32)
# Get perspective transform matrix
M = cv2.getPerspectiveTransform(src_pts, dst_pts)
# Apply perspective transform
# Make output size large enough to contain the warped garment
output_size = (frame_width, frame_height)
warped = cv2.warpPerspective(garment_resized, M, output_size,
flags=cv2.INTER_LINEAR, borderMode=cv2.BORDER_TRANSPARENT)
# Crop to the actual garment size to avoid large transparent areas
# Find non-zero alpha channel pixels
alpha = warped[:, :, 3]
coords = cv2.findNonZero(alpha)
if coords is not None and len(coords) > 0:
x, y, w, h = cv2.boundingRect(coords)
warped = warped[y:y+h, x:x+w]
return warped
except Exception as e:
print(f"Perspective transform failed: {e}")
# Continue with the regular garment if perspective transform fails
pass
print(f"Resized garment to fit body: {target_width}x{target_height} px")
return garment_resized
def resize_garment(self, garment, target_width=None, target_height=None):
"""Resize garment maintaining aspect ratio"""
if garment is None:
return None
garment_height, garment_width = garment.shape[:2]
aspect = garment_width / float(garment_height)
if target_width is not None:
new_width = target_width
new_height = int(new_width / aspect)
elif target_height is not None:
new_height = target_height
new_width = int(new_height * aspect)
else:
return garment # No resize if no dimensions provided
# High-quality resize
resized = cv2.resize(garment, (new_width, new_height), interpolation=cv2.INTER_LANCZOS4)
return resized
class AdvancedVirtualTryOn:
"""Main class for the virtual try-on system"""
def __init__(self, garment_path, camera_index=0, resolution="640x480", shiny_mode=False):
# Parse resolution
width, height = map(int, resolution.split('x'))
# Set Shiny mode
self.shiny_mode = shiny_mode
# Detect if running on Hugging Face
self.is_huggingface = os.environ.get('SPACE_ID') is not None
# Initialize components
self.pose_estimator = HumanPoseEstimator()
self.garment_processor = GarmentProcessor()
# Load garment
self.garment = self.garment_processor.load_garment(garment_path)
# Initialize camera if not in Shiny mode or handle errors gracefully
if not shiny_mode:
try:
self.camera = cv2.VideoCapture(camera_index)
self.camera.set(cv2.CAP_PROP_FRAME_WIDTH, width)
self.camera.set(cv2.CAP_PROP_FRAME_HEIGHT, height)
if not self.camera.isOpened():
print("Warning: Could not open camera. Using fallback mode.")
self.create_dummy_camera(width, height)
except Exception as e:
print(f"Error initializing camera: {e}. Using fallback mode.")
self.create_dummy_camera(width, height)
# Performance tracking
self.prev_frame_time = 0
self.new_frame_time = 0
self.fps = 0
# Garment positioning and sizing parameters - adjusted for better default fit
self.vertical_offset = 0.05
self.width_scale = 1.2 # Reduced from 1.5 for a more realistic fit
self.height_scale = 1.1 # Scale factor for garment height relative to torso
self.collar_position = 0.20 # Increased to position collar higher on neck
# UI modes
self.debug_mode = False
self.show_controls = True
self.fullscreen_mode = False
# For smoother processing and better performance
self.skip_frames = 0 # Process every frame by default
self.frame_counter = 0
self.last_warped_garment = None
self.last_keypoints = None
print("Advanced Virtual Try-On initialized.")
if not shiny_mode:
print("Starting camera feed...")
def create_dummy_camera(self, width, height):
"""Create a dummy camera object for environments without webcam access"""
# Create a dummy camera object that returns a test pattern
self.using_dummy_camera = True
self.camera = type('DummyCamera', (), {
'read': lambda _: (True, self.create_dummy_frame(width, height)),
'isOpened': lambda _: True,
'release': lambda _: None
})()
print("Using dummy camera (static test pattern).")
def create_dummy_frame(self, width, height):
"""Create a test pattern frame for the dummy camera"""
# Create a checkerboard pattern
frame = np.zeros((height, width, 3), dtype=np.uint8)
tile_size = 50
for i in range(0, height, tile_size):
for j in range(0, width, tile_size):
if (i // tile_size + j // tile_size) % 2 == 0:
frame[i:i+tile_size, j:j+tile_size] = 255
# Add some text
cv2.putText(frame, "Webcam not available", (width//2 - 150, height//2),
cv2.FONT_HERSHEY_SIMPLEX, 1, (0, 0, 255), 2, cv2.LINE_AA)
cv2.putText(frame, "Using test pattern", (width//2 - 130, height//2 + 40),
cv2.FONT_HERSHEY_SIMPLEX, 1, (0, 0, 255), 2, cv2.LINE_AA)
return frame
def update_fps(self):
"""Calculate and update FPS"""
self.new_frame_time = time.time()
self.fps = 1 / (self.new_frame_time - self.prev_frame_time) if (self.new_frame_time - self.prev_frame_time) > 0 else 0
self.prev_frame_time = self.new_frame_time
return int(self.fps)
def overlay_garment(self, frame, keypoints):
"""Overlay the garment on the frame"""
frame_height, frame_width = frame.shape[:2]
# Check if we have valid keypoints
if not keypoints or not keypoints[1]: # Neck keypoint
# Use last valid keypoints if available for smoothness
if self.last_keypoints and self.last_warped_garment is not None:
keypoints = self.last_keypoints
else:
return frame
else:
# Store last valid keypoints for smooth transitions
self.last_keypoints = keypoints
try:
# Get key body keypoints
neck = keypoints[1]
right_shoulder = keypoints[2]
left_shoulder = keypoints[5]
if not all([neck, right_shoulder, left_shoulder]):
if self.last_warped_garment is not None:
# Use last valid garment if available
warped_garment = self.last_warped_garment
else:
return frame
else:
# Calculate shoulder midpoint for better centering
shoulder_center_x = (right_shoulder[0] + left_shoulder[0]) / 2
shoulder_center_y = (right_shoulder[1] + left_shoulder[1]) / 2
# Check if we should skip processing this frame (for performance)
self.frame_counter += 1
if self.skip_frames > 0 and self.frame_counter % (self.skip_frames + 1) != 0 and self.last_warped_garment is not None:
warped_garment = self.last_warped_garment
else:
# Pass current sizing parameters to warp_garment
sizing_params = {
'width_scale': self.width_scale,
'height_scale': self.height_scale
}
# Warp garment to fit the body
warped_garment = self.garment_processor.warp_garment(
self.garment, keypoints, (frame_height, frame_width), sizing_params
)
# Save for potential reuse
self.last_warped_garment = warped_garment
if warped_garment is None:
return frame
# Calculate position
garment_height, garment_width = warped_garment.shape[:2]
if all([neck, right_shoulder, left_shoulder]):
# Center horizontally on shoulders rather than neck for better alignment
center_x = int(shoulder_center_x)
# Calculate vertical position based on neck and shoulders
# Position garment higher for more natural look
shoulder_y = (right_shoulder[1] + left_shoulder[1]) / 2
center_y = int(neck[1] + (shoulder_y - neck[1]) * 0.5 - (garment_height * self.collar_position))
else:
# Fallback to last known position
center_x = frame_width // 2
center_y = frame_height // 3
# Calculate top-left corner
x1 = center_x - garment_width // 2
y1 = center_y
# Ensure coordinates are within frame
x1 = max(0, x1)
y1 = max(0, y1)
x2 = min(frame_width, x1 + garment_width)
y2 = min(frame_height, y1 + garment_height)
# Calculate source region in garment
g_x1 = 0
g_y1 = 0
g_x2 = x2 - x1
g_y2 = y2 - y1
if g_x2 <= 0 or g_y2 <= 0 or g_x1 >= garment_width or g_y1 >= garment_height:
return frame
# Adjust if needed
if g_x2 > garment_width:
g_x2 = garment_width
x2 = x1 + g_x2
if g_y2 > garment_height:
g_y2 = garment_height
y2 = y1 + g_y2
# Extract regions
roi = frame[y1:y2, x1:x2].copy()
garment_roi = warped_garment[g_y1:g_y2, g_x1:g_x2].copy()
if roi.shape[:2] != garment_roi.shape[:2]:
return frame
# Improved alpha blending with edge feathering
alpha = garment_roi[:, :, 3] / 255.0
# Apply Gaussian blur to alpha channel for softer edges
alpha_blur = cv2.GaussianBlur(alpha, (5, 5), 0)
alpha_blur = np.repeat(alpha_blur[:, :, np.newaxis], 3, axis=2)
# Blend images with the smoothed alpha
blended = roi * (1 - alpha_blur) + garment_roi[:, :, :3] * alpha_blur
# Apply color correction to match lighting
# This helps the garment look more natural in the scene
mean_roi = np.mean(roi, axis=(0, 1))
mean_garment = np.mean(garment_roi[:, :, :3], axis=(0, 1))
# Apply subtle lighting adjustment (limit the effect for realism)
lighting_factor = 0.3
lighting_adjustment = (mean_roi - mean_garment) * lighting_factor
adjusted_garment = np.clip(garment_roi[:, :, :3] + lighting_adjustment, 0, 255)
# Final blending with lighting adjustment
final_blend = roi * (1 - alpha_blur) + adjusted_garment * alpha_blur
frame[y1:y2, x1:x2] = final_blend
except Exception as e:
print(f"Error overlaying garment: {e}")
return frame
def process_frame(self, frame):
"""Process a single frame, returning the processed frame"""
# Flip for mirror effect
frame = cv2.flip(frame, 1)
# Estimate pose
keypoints = self.pose_estimator.estimate_pose(frame)
# Overlay garment
frame = self.overlay_garment(frame, keypoints)
# Draw skeleton in debug mode
if self.debug_mode:
frame = self.pose_estimator.draw_skeleton(frame, keypoints)
# Calculate and display FPS
fps = self.update_fps()
cv2.putText(frame, f"FPS: {fps}", (10, 30), cv2.FONT_HERSHEY_SIMPLEX,
1, (0, 255, 0), 2, cv2.LINE_AA)
# Display current garment fit parameters
if self.show_controls and not self.shiny_mode:
# Display fitting instructions
instructions = [
"Controls:",
f"Width Scale: {self.width_scale:.1f} (+/- to adjust)",
f"Height Scale: {self.height_scale:.1f} (up/down arrows)",
f"Collar Position: {self.collar_position:.2f} (</> to adjust)",
f"Performance: {'High' if self.skip_frames>0 else 'Normal'} (f key)",
f"Display: {'Fullscreen' if self.fullscreen_mode else 'Window'} (s key)",
"'d' - Toggle debug | 'q' - Quit | 'c' - Hide controls"
]
y_pos = 70
for line in instructions:
cv2.putText(frame, line, (10, y_pos), cv2.FONT_HERSHEY_SIMPLEX,
0.5, (0, 255, 0), 1, cv2.LINE_AA)
y_pos += 25
elif not self.shiny_mode:
cv2.putText(frame, "Press 'c' for controls", (10, 70),
cv2.FONT_HERSHEY_SIMPLEX, 0.7, (0, 255, 0), 1, cv2.LINE_AA)
return frame
def run(self):
"""Main application loop"""
if self.shiny_mode:
print("Shiny mode is active. The main loop will be controlled by the Shiny app.")
return
print("Advanced Virtual Try-On started. Press 'q' to quit, 'd' to toggle debug mode.")
print("Use '+'/'-' to adjust garment width, 'up'/'down' arrows to adjust height.")
print("Use 'c' to toggle control instructions, 'f' to toggle frame skipping for better performance.")
print("Press 's' to toggle fullscreen mode.")
# Create a resizable window
cv2.namedWindow('Advanced Virtual Try-On', cv2.WINDOW_NORMAL)
while self.camera.isOpened():
success, frame = self.camera.read()
if not success:
print("Failed to capture frame")
break
# Process the frame
frame = self.process_frame(frame)
# Display the result
cv2.imshow('Advanced Virtual Try-On', frame)
# Handle key presses
key = cv2.waitKey(1) & 0xFF
# Quit
if key == ord('q'):
break
# Toggle debug mode
elif key == ord('d'):
self.debug_mode = not self.debug_mode
print(f"Debug mode: {'ON' if self.debug_mode else 'OFF'}")
# Toggle control display
elif key == ord('c'):
self.show_controls = not self.show_controls
# Toggle fullscreen mode
elif key == ord('s'):
self.fullscreen_mode = not self.fullscreen_mode
if self.fullscreen_mode:
cv2.setWindowProperty('Advanced Virtual Try-On', cv2.WND_PROP_FULLSCREEN, cv2.WINDOW_FULLSCREEN)
print("Fullscreen mode enabled")
else:
cv2.setWindowProperty('Advanced Virtual Try-On', cv2.WND_PROP_FULLSCREEN, cv2.WINDOW_NORMAL)
print("Window mode enabled")
# Adjust width scale
elif key == ord('+') or key == ord('='): # = is on the same key as + without shift
self.width_scale = min(3.0, self.width_scale + 0.1)
print(f"Width scale: {self.width_scale:.1f}")
elif key == ord('-'):
self.width_scale = max(0.8, self.width_scale - 0.1)
print(f"Width scale: {self.width_scale:.1f}")
# Adjust height scale
elif key == 82: # Up arrow
self.height_scale = min(2.0, self.height_scale + 0.1)
print(f"Height scale: {self.height_scale:.1f}")
elif key == 84: # Down arrow
self.height_scale = max(0.6, self.height_scale - 0.1)
print(f"Height scale: {self.height_scale:.1f}")
# Adjust collar position
elif key == ord(',') or key == ord('<'):
self.collar_position = max(0.05, self.collar_position - 0.01)
print(f"Collar position: {self.collar_position:.2f}")
elif key == ord('.') or key == ord('>'):
self.collar_position = min(0.3, self.collar_position + 0.01)
print(f"Collar position: {self.collar_position:.2f}")
# Toggle performance mode
elif key == ord('f'):
# Toggle between 0, 1, and 2 frame skips
self.skip_frames = (self.skip_frames + 1) % 3
print(f"Performance mode: {'High (skip {self.skip_frames} frames)' if self.skip_frames>0 else 'Normal'}")
# Clean up
self.clean_up()
def clean_up(self):
"""Clean up resources"""
if hasattr(self, 'camera') and not self.shiny_mode and self.camera.isOpened():
self.camera.release()
cv2.destroyAllWindows()
print("Application closed.")
class TkinterUI:
"""Tkinter UI for the virtual try-on application"""
def __init__(self, webcam_index=0, resolution="640x480"):
# Import tkinter here instead of at the top level
try:
import tkinter as tk
from tkinter import filedialog, Label, Button, Frame
self.tk_available = True
except ImportError:
print("Tkinter is not available in this environment.")
self.tk_available = False
return
self.webcam_index = webcam_index
self.width, self.height = map(int, resolution.split('x'))
self.app = None
self.running = False
self.garment_path = None
self.root = None
self.webcam_label = None
self.update_interval = 10 # Update every 10ms
def start(self):
"""Start the Tkinter UI"""
if not self.tk_available:
print("Cannot start Tkinter UI: Tkinter is not available.")
return
# Import tkinter here to use its symbols
import tkinter as tk
from tkinter import filedialog, Label, Button, Frame
self.root = tk.Tk()
self.root.title("Virtual Try-On")
self.root.geometry(f"{self.width + 300}x{self.height + 100}")
self.root.resizable(True, True)
self.root.protocol("WM_DELETE_WINDOW", self.on_close)
# Main frame
main_frame = Frame(self.root)
main_frame.pack(fill=tk.BOTH, expand=True, padx=10, pady=10)
# Left side - webcam and controls
left_frame = Frame(main_frame)
left_frame.pack(side=tk.LEFT, fill=tk.BOTH, expand=True)
# Webcam frame
webcam_frame = Frame(left_frame, width=self.width, height=self.height)
webcam_frame.pack(pady=10)
webcam_frame.pack_propagate(0) # Don't shrink
self.webcam_label = Label(webcam_frame)
self.webcam_label.pack(fill=tk.BOTH, expand=True)
# Control buttons
control_frame = Frame(left_frame)
control_frame.pack(fill=tk.X, pady=10)
upload_btn = Button(control_frame, text="Upload Garment", command=self.upload_garment)
upload_btn.pack(side=tk.LEFT, padx=5)
start_btn = Button(control_frame, text="Start Try-On", command=self.start_tryon)
start_btn.pack(side=tk.LEFT, padx=5)
stop_btn = Button(control_frame, text="Stop", command=self.stop_tryon)
stop_btn.pack(side=tk.LEFT, padx=5)
# Right side - adjustments and garment preview
right_frame = Frame(main_frame, width=280)
right_frame.pack(side=tk.RIGHT, fill=tk.Y, padx=10)
right_frame.pack_propagate(0) # Don't shrink
# Garment preview
preview_label = Label(right_frame, text="Garment Preview")
preview_label.pack(pady=(0, 5))
self.garment_preview = Label(right_frame, text="No garment selected")
self.garment_preview.pack(pady=5)
# Adjustments
adjustments_label = Label(right_frame, text="Adjustments")
adjustments_label.pack(pady=(15, 5))
# Width scale slider
width_frame = Frame(right_frame)
width_frame.pack(fill=tk.X, pady=5)
Label(width_frame, text="Width:").pack(side=tk.LEFT)
self.width_scale_var = tk.DoubleVar(value=1.2)
self.width_scale = tk.Scale(width_frame, from_=0.8, to=3.0, resolution=0.1, orient=tk.HORIZONTAL,
variable=self.width_scale_var, command=self.update_params)
self.width_scale.pack(side=tk.RIGHT, fill=tk.X, expand=True)
# Height scale slider
height_frame = Frame(right_frame)
height_frame.pack(fill=tk.X, pady=5)
Label(height_frame, text="Height:").pack(side=tk.LEFT)
self.height_scale_var = tk.DoubleVar(value=1.1)
self.height_scale = tk.Scale(height_frame, from_=0.6, to=2.0, resolution=0.1, orient=tk.HORIZONTAL,
variable=self.height_scale_var, command=self.update_params)
self.height_scale.pack(side=tk.RIGHT, fill=tk.X, expand=True)
# Collar position slider
collar_frame = Frame(right_frame)
collar_frame.pack(fill=tk.X, pady=5)
Label(collar_frame, text="Collar:").pack(side=tk.LEFT)
self.collar_var = tk.DoubleVar(value=0.2)
self.collar_scale = tk.Scale(collar_frame, from_=0.05, to=0.3, resolution=0.01, orient=tk.HORIZONTAL,
variable=self.collar_var, command=self.update_params)
self.collar_scale.pack(side=tk.RIGHT, fill=tk.X, expand=True)
# Debug mode checkbox
debug_frame = Frame(right_frame)
debug_frame.pack(fill=tk.X, pady=5)
self.debug_var = tk.BooleanVar(value=False)
debug_check = tk.Checkbutton(debug_frame, text="Show Skeleton", variable=self.debug_var,
command=self.update_params)
debug_check.pack(side=tk.LEFT)
# Status label
self.status_label = Label(right_frame, text="Ready")
self.status_label.pack(pady=10)
# Start main loop
self.root.mainloop()
def upload_garment(self):
"""Open file dialog to select a garment image"""
filetypes = [
("Image files", "*.png *.jpg *.jpeg"),
("PNG files", "*.png"),
("JPEG files", "*.jpg *.jpeg"),
("All files", "*.*")
]
self.garment_path = filedialog.askopenfilename(
title="Select Garment Image",
filetypes=filetypes
)
if self.garment_path:
self.status_label.config(text=f"Garment selected: {os.path.basename(self.garment_path)}")
self.load_preview()
def load_preview(self):
"""Load and display the garment preview"""
if not self.garment_path:
return
try:
# Load image with PIL for preview
pil_img = Image.open(self.garment_path)
# Resize for preview (keep aspect ratio)
preview_width = 250
aspect_ratio = pil_img.width / pil_img.height
preview_height = int(preview_width / aspect_ratio)
# Limit height
if preview_height > 300:
preview_height = 300
preview_width = int(preview_height * aspect_ratio)
pil_img = pil_img.resize((preview_width, preview_height), Image.LANCZOS)
# Convert to Tkinter format
tk_img = ImageTk.PhotoImage(pil_img)
# Update preview
self.garment_preview.config(image=tk_img)
self.garment_preview.image = tk_img # Keep a reference
except Exception as e:
self.status_label.config(text=f"Error loading preview: {e}")
def start_tryon(self):
"""Start the virtual try-on"""
if not self.garment_path:
self.status_label.config(text="Please select a garment first")
return
if self.running:
self.status_label.config(text="Already running")
return
try:
# Initialize the virtual try-on application
self.app = AdvancedVirtualTryOn(
self.garment_path,
self.webcam_index,
f"{self.width}x{self.height}"
)
# Set initial parameters
self.update_params()
# Start the webcam
self.running = True
self.status_label.config(text="Try-on started")
# Start updating frames
self.update_frame()
except Exception as e:
self.status_label.config(text=f"Error starting try-on: {e}")
def update_params(self, *args):
"""Update the application parameters from UI controls"""
if self.app:
self.app.width_scale = self.width_scale_var.get()
self.app.height_scale = self.height_scale_var.get()
self.app.collar_position = self.collar_var.get()
self.app.debug_mode = self.debug_var.get()
def update_frame(self):
"""Update the webcam frame"""
if not self.running or not self.app:
return
try:
# Get frame from camera
ret, frame = self.app.camera.read()
if ret:
# Process the frame
processed = self.app.process_frame(frame)
# Convert to PIL format
pil_img = Image.fromarray(cv2.cvtColor(processed, cv2.COLOR_BGR2RGB))
# Convert to Tkinter format
tk_img = ImageTk.PhotoImage(image=pil_img)
# Update image
self.webcam_label.config(image=tk_img)
self.webcam_label.image = tk_img # Keep a reference
# Schedule next update
self.root.after(self.update_interval, self.update_frame)
except Exception as e:
self.status_label.config(text=f"Error updating frame: {e}")
self.stop_tryon()
def stop_tryon(self):
"""Stop the virtual try-on"""
self.running = False
if self.app:
self.app.clean_up()
self.app = None
self.status_label.config(text="Try-on stopped")
def on_close(self):
"""Handle window close event"""
self.stop_tryon()
if self.root:
self.root.destroy()
def run_tkinter_app(webcam_index=0, resolution="640x480"):
"""Run the application with Tkinter UI"""
# Check if Tkinter is available
try:
import tkinter as tk
tk_available = True
except ImportError:
print("Tkinter is not available in this environment. Cannot run Tkinter UI.")
print("Try running with --shiny instead.")
tk_available = False
return
ui = TkinterUI(webcam_index, resolution)
ui.start()
def run_shiny_app():
"""Run the application in Shiny mode"""
app_ui = ui.page_fluid(
ui.tags.head(
ui.tags.title("Advanced Virtual Try-On"),
ui.tags.style("""
.container { max-width: 1200px; }
.row { margin-bottom: 20px; }
.col-md-6 { padding: 10px; }
.well { background-color: #f8f9fa; padding: 15px; border-radius: 5px; }
.form-group { margin-bottom: 15px; }
.control-label { font-weight: bold; }
.img-preview { max-width: 100%; height: auto; }
.info-box { background-color: #e6f7ff; padding: 15px; border-radius: 5px; margin-bottom: 15px; }
.sample-btn { margin-top: 10px; }
""")
),
ui.div(
{"class": "container"},
ui.h1("Advanced Virtual Try-On"),
ui.p("Try on clothing virtually using your webcam"),
# Info box for Hugging Face
ui.div(
{"class": "info-box"},
ui.h4("Welcome to Virtual Try-On!"),
ui.p("1. Upload a garment image with transparent background, or use the sample garment"),
ui.p("2. Click 'Start Try-On' to virtually try on the garment"),
ui.p("3. Adjust the fit using the sliders below")
),
ui.div(
{"class": "row"},
ui.div(
{"class": "col-md-6"},
ui.div(
{"class": "well"},
ui.h3("Settings"),
ui.input_file("garment_upload", "Upload Garment Image",
accept=[".png", ".jpg", ".jpeg"]),
ui.div(
{"class": "sample-btn"},
ui.input_action_button("use_sample", "Use Sample Garment",
class_="btn-info")
),
ui.div(
{"class": "form-group"},
ui.input_slider("width_scale", "Width Scale",
min=0.8, max=3.0, value=1.2, step=0.1),
ui.input_slider("height_scale", "Height Scale",
min=0.6, max=2.0, value=1.1, step=0.1),
ui.input_slider("collar_position", "Collar Position",
min=0.05, max=0.3, value=0.2, step=0.01),
ui.input_checkbox("debug_mode", "Show Skeleton", value=False)
),
ui.div(
{"class": "form-group"},
ui.input_action_button("start_button", "Start Try-On",
class_="btn-primary"),
ui.input_action_button("stop_button", "Stop",
class_="btn-danger")
)
)
),
ui.div(
{"class": "col-md-6"},
ui.div(
{"class": "well"},
ui.h3("Preview"),
ui.output_image("garment_preview"),
ui.h3("Live Try-On"),
ui.output_image("webcam_feed")
)
)
)
)
)
def server(input, output, session):
# Initialize reactive values
app = reactive.Value(None)
is_running = reactive.Value(False)
temp_garment_file = reactive.Value(None)
# Create sample garment directory and file
def create_sample_garment():
# Create a simple t-shirt shape with alpha channel
width, height = 400, 500
img = np.zeros((height, width, 4), dtype=np.uint8)
# Draw a simple t-shirt shape
# Body of the shirt
cv2.rectangle(img, (100, 150), (300, 450), (0, 0, 255, 255), -1)
# Sleeves
cv2.rectangle(img, (50, 150), (100, 250), (0, 0, 255, 255), -1)
cv2.rectangle(img, (300, 150), (350, 250), (0, 0, 255, 255), -1)
# Neck cut
cv2.rectangle(img, (150, 100), (250, 150), (0, 0, 0, 0), -1)
# Save to a temp file
os.makedirs('temp', exist_ok=True)
sample_path = os.path.join('temp', 'sample_tshirt.png')
cv2.imwrite(sample_path, img)
return sample_path
@reactive.Effect
@reactive.event(input.garment_upload)
def handle_garment_upload():
if input.garment_upload() is not None:
# Save uploaded file to temp
temp_file = tempfile.NamedTemporaryFile(delete=False, suffix=".png")
temp_file.write(input.garment_upload()["datapath"])
temp_file.close()
temp_garment_file.set(temp_file.name)
@reactive.Effect
@reactive.event(input.use_sample)
def use_sample_garment():
sample_path = create_sample_garment()
temp_garment_file.set(sample_path)
ui.notification_show("Using sample garment", type="info")
@reactive.Effect
@reactive.event(input.start_button)
def start_tryon():
if not temp_garment_file.get():
ui.notification_show("Please upload a garment or use the sample", type="warning")
return
if not is_running.get():
try:
app.set(AdvancedVirtualTryOn(
temp_garment_file.get(),
0,
"640x480",
shiny_mode=True
))
is_running.set(True)
ui.notification_show("Try-on started", type="success")
except Exception as e:
ui.notification_show(f"Error starting try-on: {e}", type="error")
@reactive.Effect
@reactive.event(input.stop_button)
def stop_tryon():
if is_running.get():
if app.get():
app.get().clean_up()
is_running.set(False)
ui.notification_show("Try-on stopped", type="info")
@output
@render.image
def garment_preview():
if temp_garment_file.get():
try:
img = Image.open(temp_garment_file.get())
# Convert to base64
buffered = io.BytesIO()
img.save(buffered, format="PNG")
img_str = base64.b64encode(buffered.getvalue()).decode()
return ImgData(src=f"data:image/png;base64,{img_str}")
except Exception as e:
print(f"Error displaying garment preview: {e}")
return None
@output
@render.image
def webcam_feed():
if is_running.get() and app.get():
try:
# Get frame from camera
ret, frame = app.get().camera.read()
if ret:
# Process the frame
processed = app.get().process_frame(frame)
# Convert to PIL Image
img = Image.fromarray(cv2.cvtColor(processed, cv2.COLOR_BGR2RGB))
# Convert to base64
buffered = io.BytesIO()
img.save(buffered, format="JPEG")
img_str = base64.b64encode(buffered.getvalue()).decode()
return ImgData(src=f"data:image/jpeg;base64,{img_str}")
except Exception as e:
ui.notification_show(f"Error processing frame: {e}", type="error")
return None
# Update app parameters when sliders change
@reactive.Effect
def update_params():
if app.get():
app.get().width_scale = input.width_scale()
app.get().height_scale = input.height_scale()
app.get().collar_position = input.collar_position()
app.get().debug_mode = input.debug_mode()
# Set default sample garment on startup
if os.environ.get('SPACE_ID') is not None:
# If running on Hugging Face, automatically load sample garment
sample_path = create_sample_garment()
temp_garment_file.set(sample_path)
return App(app_ui, server)
def main():
# Check if running on Hugging Face Spaces
is_huggingface = os.environ.get('SPACE_ID') is not None
args = parse_args()
try:
# When running on Hugging Face, automatically use Shiny mode
if is_huggingface:
print("Running on Hugging Face Spaces. Starting in Shiny mode...")
app = run_shiny_app()
app.run(host="0.0.0.0", port=int(os.environ.get('PORT', 8000)))
# Otherwise, check command line arguments
elif args.shiny:
app = run_shiny_app()
app.run(host="0.0.0.0", port=8000)
elif args.tkinter or (not args.garment and not args.shiny):
# Check if Tkinter is available before trying to use it
try:
import tkinter
# Use tkinter by default if no garment is specified
run_tkinter_app(args.webcam, args.resolution)
except ImportError:
print("Tkinter is not available. Falling back to Shiny mode.")
app = run_shiny_app()
app.run(host="0.0.0.0", port=8000)
else:
# Traditional command-line mode if garment is specified
width, height = map(int, args.resolution.split('x'))
app = AdvancedVirtualTryOn(args.garment, args.webcam, args.resolution)
app.run()
except Exception as e:
print(f"Error: {e}")
import traceback
traceback.print_exc()
if __name__ == "__main__":
main()