Spaces:

BestWJH
/

PEAR

Build error

App Files Files Community

PEAR / app.py

BestWJH

Update app.py

4abbc1c verified about 1 month ago

raw

history blame contribute delete

29.9 kB

	import os
	import shutil
	import site
	import sys
	import importlib

	def migrate_precompiled_packages():
	# 1. 获取目标 site-packages 路径
	target_site_packages = site.getsitepackages()[0]

	# 定义需要迁移的包及其对应的关键模块名（用于存在性检查）
	packages_to_check = {
	'pytorch3d': ['pytorch3d', 'pytorch3d-0.7.8.dist-info'],
	'chumpy': ['chumpy', 'chumpy-0.70.dist-info']
	}

	print(f"📦 Starting migration check in: {os.getcwd()}")

	for pkg_name, folders in packages_to_check.items():
	# 检查包是否已经安装且可用
	try:
	importlib.import_module(pkg_name)
	print(f"✅ {pkg_name} is already available. Skipping.")
	continue
	except ImportError:
	print(f"🔍 {pkg_name} not found. Preparing to migrate...")

	for folder in folders:
	src = os.path.abspath(folder)
	dst = os.path.join(target_site_packages, folder)

	if os.path.exists(src):
	try:
	if os.path.exists(dst):
	print(f"⚠️ Removing existing {dst}...")
	shutil.rmtree(dst) if os.path.isdir(dst) else os.remove(dst)

	print(f"🚚 Copying {folder} to site-packages...")
	shutil.copytree(src, dst)
	except Exception as e:
	print(f"❌ Failed to migrate {folder}: {e}")
	else:
	print(f"❓ Source {folder} missing in root directory.")

	# 2. 核心补丁：刷新搜索路径并置顶
	importlib.invalidate_caches()
	if target_site_packages not in sys.path:
	sys.path.insert(0, target_site_packages)

	# 3. 针对 PyTorch3D 的动态链接补丁 (解决 libc10.so 找不到的问题)
	try:
	import torch
	torch_lib_path = os.path.join(os.path.dirname(torch.__file__), "lib")
	os.environ["LD_LIBRARY_PATH"] = torch_lib_path + ":" + os.environ.get("LD_LIBRARY_PATH", "")
	print(f"🔗 LD_LIBRARY_PATH updated with torch libs.")
	except Exception as e:
	print(f"⚠️ Failed to set LD_LIBRARY_PATH: {e}")

	# 执行迁移
	migrate_precompiled_packages()

	# 验证安装
	try:
	import chumpy
	import pytorch3d
	from pytorch3d import _C
	print(f"🎉 All systems go! PyTorch3D GPU: {hasattr(_C, 'rasterize_meshes')}")
	except Exception as e:
	print(f"🚨 Validation failed: {e}")


	import gradio as gr
	import os
	import json
	import numpy as np
	import cv2
	import base64
	import time
	import shutil
	import glob
	from pathlib import Path
	from typing import List, Tuple, Union
	from concurrent.futures import ThreadPoolExecutor
	import atexit
	import uuid
	import logging
	from huggingface_hub import hf_hub_download
	import torch
	import decord
	try:
	import spaces
	except ImportError:
	# Fallback for local development
	def space(func):
	return func
	import imageio

	from einops import rearrange

	from models.modules.ehm import EHM_v2
	from models.pipeline.ehm_pipeline import Ehm_Pipeline
	from utils.pipeline_utils import to_tensor
	from utils.graphics_utils import GS_Camera
	from models.modules.renderer.body_renderer import Renderer2 as BodyRenderer
	from pytorch3d.renderer import PointLights
	from utils.general_utils import (
	ConfigDict,
	rtqdm,
	device_parser,
	add_extra_cfgs,
	)
	from scipy.signal import savgol_filter
	try:
	import spaces # for HuggingFace Spaces
	except ImportError:
	# Fallback for local development
	def spaces(func):
	return func


	logger = logging.getLogger(__name__)

	# -------------------------------------------------------------------------
	# Device & runtime configuration (CPU / GPU agnostic)
	# -------------------------------------------------------------------------
	TORCH_DEVICE = torch.device("cuda" if torch.cuda.is_available() else "cpu")
	ORT_PROVIDERS = ["CUDAExecutionProvider", "CPUExecutionProvider"]



	meta_cfg = ConfigDict(
	model_config_path=os.path.join("configs", "infer.yaml")
	)
	meta_cfg = add_extra_cfgs(meta_cfg)

	# Renderer / model init (on selected device)
	body_renderer = BodyRenderer("assets/SMPLX", 1024, focal_length=24.0)


	repo_id = "BestWJH/PEAR_models"
	filename = "ehm_model_stage1.pt"

	ehm_basemodel = hf_hub_download(repo_id=repo_id, filename=filename, repo_type="model")
	ehm_model = Ehm_Pipeline(meta_cfg)

	_state = torch.load(ehm_basemodel, map_location='cpu', weights_only=True)
	ehm_model.backbone.load_state_dict(_state['backbone'], strict=False)
	ehm_model.head.load_state_dict(_state['head'], strict=False)

	ehm = EHM_v2("assets/FLAME", "assets/SMPLX", "assets/MANO")


	# lights = PointLights(device=TORCH_DEVICE, location=[[0.0, -1.0, -10.0]])

	# 2. 将 lights 的初始化移入函数，或确保它能动态转换
	def get_lights(device):
	return PointLights(device=device, location=[[0.0, -1.0, -10.0]])




	# Thread pool for delayed deletion
	thread_pool_executor = ThreadPoolExecutor(max_workers=2)

	def build_cameras_kwargs(batch_size, focal_length):
	screen_size = (
	torch.tensor([1024, 1024], device=TORCH_DEVICE)
	.float()[None]
	.repeat(batch_size, 1)
	)
	cameras_kwargs = {
	"principal_point": torch.zeros(batch_size, 2, device=TORCH_DEVICE).float(),
	"focal_length": focal_length,
	"image_size": screen_size,
	"device": TORCH_DEVICE,
	}
	return cameras_kwargs



	def pad_and_resize(img, target_size=512):

	h, w = img.shape[:2]

	# 等比例缩放
	scale = min(target_size / h, target_size / w)
	new_w, new_h = int(w * scale), int(h * scale)
	resized_img = cv2.resize(img, (new_w, new_h), interpolation=cv2.INTER_LINEAR)

	# 创建黑色背景图像并粘贴到中心
	padded_img = np.zeros((target_size, target_size, 3), dtype=np.uint8)
	x_offset = (target_size - new_w) // 2
	y_offset = (target_size - new_h) // 2
	padded_img[y_offset:y_offset + new_h, x_offset:x_offset + new_w] = resized_img

	return padded_img

	def delete_later(path: Union[str, os.PathLike], delay: int = 600):
	"""Delete file or directory after specified delay (default 10 minutes)"""
	def _delete():
	try:
	if os.path.isfile(path):
	os.remove(path)
	elif os.path.isdir(path):
	shutil.rmtree(path)
	except Exception as e:
	logger.warning(f"Failed to delete {path}: {e}")

	def _wait_and_delete():
	time.sleep(delay)
	_delete()

	thread_pool_executor.submit(_wait_and_delete)
	atexit.register(_delete)


	def create_user_temp_dir():
	"""Create a unique temporary directory for each user session"""
	session_id = str(uuid.uuid4())[:8] # Short unique ID
	PROJECT_ROOT = os.path.dirname(os.path.abspath(__file__))
	temp_dir = os.path.join(
	PROJECT_ROOT, "temp_local", f"session_{session_id}"
	)

	os.makedirs(temp_dir, exist_ok=True)

	# Schedule deletion after 10 minutes
	delete_later(temp_dir, delay=600)

	return temp_dir

	def get_video_name(video_path):
	"""Extract video name without extension"""
	return os.path.splitext(os.path.basename(video_path))[0]

	def extract_first_frame(video_path):
	"""Extract first frame from video file"""
	try:
	cap = cv2.VideoCapture(video_path)
	ret, frame = cap.read()
	cap.release()

	if ret:
	frame_rgb = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
	return frame_rgb
	else:
	return None
	except Exception as e:
	print(f"Error extracting first frame: {e}")
	return None

	def numpy_to_base64(arr):
	"""Convert numpy array to base64 string"""
	return base64.b64encode(arr.tobytes()).decode('utf-8')


	def polynomial_smooth(sequence, window_size=5, polyorder=2):

	seq = np.asarray(sequence.cpu())
	if seq.ndim < 2:
	raise ValueError(f"输入必须至少是 2 维，当前 shape={seq.shape}")

	if window_size % 2 == 0:
	raise ValueError("window_size 必须是奇数")
	if polyorder >= window_size:
	raise ValueError("polyorder 必须小于 window_size")

	# Savitzky–Golay 沿着 axis=0 (时间维) 平滑
	smoothed = savgol_filter(seq, window_length=window_size, polyorder=polyorder, axis=0, mode='interp')
	return smoothed


	def handle_video_upload(video):
	"""Handle video upload and extract first frame"""
	if video is None:
	return None

	# Create user-specific temporary directory
	user_temp_dir = create_user_temp_dir()

	# Get original video name and copy to temp directory
	# if isinstance(video, str):
	# video_name = get_video_name(video)
	# video_path = os.path.join(user_temp_dir, f"{video_name}.mp4")
	# shutil.copy(video, video_path)
	# else:
	# video_name = get_video_name(video.name)
	# video_path = os.path.join(user_temp_dir, f"{video_name}.mp4")
	# with open(video_path, 'wb') as f:
	# f.write(video.read())

	# 确定输入源路径/
	input_source = video if isinstance(video, str) else video.name

	video_name = get_video_name(input_source)
	video_path = os.path.join(user_temp_dir, f"{video_name}.mp4")

	try:
	# 使用 imageio 读取视频
	reader = imageio.get_reader(input_source)
	meta_data = reader.get_meta_data()
	fps = meta_data.get('fps', 30)
	max_frames = int(fps * 3)
	writer = imageio.get_writer(video_path, fps=fps, codec='libx264', quality=8)

	for i, frame in enumerate(reader):
	if i >= max_frames:
	break
	writer.append_data(frame)

	reader.close()
	writer.close()
	print(f"成功截取前 3 秒视频并保存至: {video_path}")

	except Exception as e:
	print(f"imageio 处理视频失败: {e}")


	print(f"📁 Video saved to: {video_path}")

	# Extract first frame
	frame = extract_first_frame(video_path)
	if frame is None:
	return None

	# Resize frame to have minimum side length of 336
	h, w = frame.shape[:2]
	scale = 336 / min(h, w)
	new_h, new_w = int(h * scale)//22, int(w scale)//2*2
	frame = cv2.resize(frame, (new_w, new_h), interpolation=cv2.INTER_LINEAR)

	# Store frame data with temp directory info
	frame_data = {
	'data': numpy_to_base64(frame),
	'shape': frame.shape,
	'dtype': str(frame.dtype),
	'temp_dir': user_temp_dir,
	'video_name': video_name,
	'video_path': video_path
	}

	# Get video-specific settings
	print(f"🎬 Video path: '{video}' -> Video name: '{video_name}'")

	return (json.dumps(frame_data) )

	@spaces.GPU
	@torch.no_grad()
	def mesh_inference(temp_dir, video_name):

	global body_renderer, ehm_model, ehm
	body_renderer = body_renderer.to(TORCH_DEVICE)
	ehm_model = ehm_model.to(TORCH_DEVICE)
	ehm = ehm.to(TORCH_DEVICE)
	lights = get_lights(TORCH_DEVICE)

	# ... 后续推理逻辑 ...
	# Setup paths
	video_path = os.path.join(temp_dir, f"{video_name}.mp4")

	out_dir = os.path.join(temp_dir, "results")
	os.makedirs(out_dir, exist_ok=True)

	# Load video using decord
	video_reader = decord.VideoReader(video_path)
	# Don't load all frames at once; process frame-by-frame to save memory.


	# Run the EHM pipeline
	print(f"🎯 Running EHM pipeline...")
	ehm_out_dir = os.path.join(out_dir, "ehm_results")
	os.makedirs(ehm_out_dir, exist_ok=True)



	all_meshes_img = []
	vertices_list = []
	body_sequence = []
	flame_sequence = []
	cam_sequence = []
	# Process each frame with EHM
	for i in range(len(video_reader)):
	frame = video_reader[i].asnumpy()
	# TODO: Apply EHM processing to frame
	resized = pad_and_resize(frame, target_size=256)
	img_patch = to_tensor(resized, TORCH_DEVICE) # (B, C, H, W)
	img_patch = torch.permute(img_patch/255,(2,0,1)).unsqueeze(0)

	outputs = ehm_model(img_patch) # 转移到 cuda 了


	body_sequence.append(outputs['body_param'])
	flame_sequence.append(outputs['flame_param'])
	cam_sequence.append(outputs['pd_cam'])


	fields1 = [
	"global_pose", "body_pose", "left_hand_pose", "right_hand_pose",
	"hand_scale", "head_scale", "exp", "shape"
	]

	processed1 = {}
	for key in fields1:
	data_list = [seq[key] for seq in body_sequence]
	data_tensor = torch.cat(data_list, dim=0)
	processed1[key] = torch.tensor(polynomial_smooth(data_tensor, window_size=7, polyorder=2)).cuda()

	global_pose = processed1["global_pose"]
	body_pose = processed1["body_pose"]
	left_hand_pose = processed1["left_hand_pose"]
	right_hand_pose = processed1["right_hand_pose"]
	hand_scale = processed1["hand_scale"]
	head_scale = processed1["head_scale"]
	exp = processed1["exp"]
	shape = processed1["shape"]

	# 第二步：从 eye_pose_params 中提取字段并平滑
	fields2 = [
	"eye_pose_params", "pose_params", "jaw_params",
	"eyelid_params", "expression_params", "shape_params"
	]

	processed2 = {}
	for key in fields2:
	data_list = [seq[key] for seq in flame_sequence] # 这里我猜你原意是从 eye_pose_params 取
	data_tensor = torch.cat(data_list, dim=0)
	processed2[key] = torch.tensor(polynomial_smooth(data_tensor, window_size=5, polyorder=2)).cuda()

	eye_pose_params = processed2["eye_pose_params"]
	pose_params = processed2["pose_params"]
	jaw_params = processed2["jaw_params"]
	eyelid_params = processed2["eyelid_params"]
	expression_params = processed2["expression_params"]
	shape_params = processed2["shape_params"]


	cam_sequence = torch.cat(cam_sequence, dim=0)
	cam_sequence = torch.tensor(polynomial_smooth(cam_sequence, window_size=7, polyorder=2)).cuda()




	for idx in range(global_pose.shape[0]):

	pd_cam = cam_sequence[idx:idx+1]

	body_dict = {
	"global_pose": global_pose[idx:idx+1],
	"body_pose" : body_pose[idx:idx+1],
	"left_hand_pose" : left_hand_pose[idx:idx+1],
	"right_hand_pose" : right_hand_pose[idx:idx+1],
	"hand_scale" : hand_scale[idx:idx+1],
	"head_scale" : head_scale[idx:idx+1],
	"exp" : exp[idx:idx+1] ,
	"shape": shape[idx:idx+1],
	'eye_pose' :None,
	'jaw_pose' : None,
	'joints_offset' : None
	}
	flame_dict ={
	"eye_pose_params" : eye_pose_params[idx:idx+1],
	"pose_params" : pose_params[idx:idx+1],
	"jaw_params" : jaw_params[idx:idx+1],
	"eyelid_params" : eyelid_params[idx:idx+1],
	"expression_params" : expression_params[idx:idx+1] ,
	"shape_params": shape_params[idx:idx+1]
	}

	pd_smplx_dict = ehm(body_dict, flame_dict, pose_type='aa')
	pd_camera = GS_Camera(**build_cameras_kwargs(1,24), R = pd_cam[0:1,:3,:3], T = pd_cam[0:1,:3,3])
	pd_mesh_img = body_renderer.render_mesh(pd_smplx_dict['vertices'][None, 0,...], pd_camera, lights=lights,)
	pd_mesh_img = (pd_mesh_img[:,:3].detach().cpu().numpy()).clip(0, 255).astype(np.uint8)[0].transpose(1,2,0)
	# pd_mesh_img = cv2.cvtColor(pd_mesh_img.copy(), cv2.COLOR_RGB2BGR)
	all_meshes_img.append(pd_mesh_img)

	# vertices_list.append(pd_smplx_dict['vertices'][0, :-120].detach().cpu().numpy())



	# Save results
	mesh_video_path = os.path.join(out_dir, "mesh_video.mp4")
	# Write a browser-compatible MP4:
	# - H.264 + yuv420p for broad HTML5 support
	# - faststart so it can stream/play immediately
	if len(all_meshes_img) == 0:
	raise RuntimeError("No frames generated for mesh video.")
	fps = 30
	try:
	writer = imageio.get_writer(
	mesh_video_path,
	fps=fps,
	codec="libx264",
	pixelformat="yuv420p",
	ffmpeg_params=["-movflags", "faststart"],
	macro_block_size=None,
	)
	for img in all_meshes_img:
	# Ensure even H/W for yuv420p
	h, w = img.shape[:2]
	img2 = img[: h - (h % 2), : w - (w % 2)]
	writer.append_data(img2)
	writer.close()
	except Exception as e:
	print(f"⚠️ imageio ffmpeg writer failed ({e}); falling back to mimwrite")
	imageio.mimwrite(mesh_video_path, all_meshes_img, fps=fps)

	# Save a portable npz (avoid storing Trimesh objects which will fail).
	# vertices: (T, V, 3), faces: (F, 3)
	faces = body_renderer.faces[0].detach().cpu().numpy()
	vertices = np.stack(vertices_list, axis=0) if len(vertices_list) > 0 else np.empty((0, 0, 3), dtype=np.float32)
	np.savez_compressed(os.path.join(out_dir, "results.npz"), vertices=vertices, faces=faces)


	print(f"✅ EHM processing completed.")



	# @torch.no_grad()
	def launch_viz(original_image_state):
	"""Launch visualization with user-specific temp directory"""
	if original_image_state is None:
	return None, None

	try:
	# Get user's temp directory from stored frame data
	frame_data = json.loads(original_image_state)

	temp_dir = frame_data.get("temp_dir", "temp_local")
	video_name = frame_data.get("video_name", "video")

	print(f"🚀 Starting recover for video: {video_name}")

	# Run tracker
	print("🎯 Running...")
	out_dir = os.path.join(temp_dir, "results")
	os.makedirs(out_dir, exist_ok=True)

	mesh_inference(temp_dir, video_name)

	delete_later(temp_dir, delay=600)

	npz_path = os.path.join(out_dir, "results.npz")
	mesh_video = os.path.join(out_dir, "mesh_video.mp4")

	if os.path.exists(mesh_video):
	print("✅ Tracking completed successfully!")
	# Returning the path lets gr.Video handle file serving & controls
	return mesh_video, (npz_path if os.path.exists(npz_path) else None)
	else:
	print("❌ Tracking failed - no results generated")
	return None, None

	except Exception as e:
	print(f"❌ Error in launch_viz: {e}")
	return None, None



	# Create the Gradio interface
	print("🎨 Creating Gradio interface...")

	with gr.Blocks(
	theme=gr.themes.Soft(),
	title="🎯 [PEAR](https://wujh2001.github.io/PEAR/)",
	css="""
	.gradio-container {
	max-width: 1200px !important;
	margin: auto !important;
	}
	.gr-button {
	margin: 5px;
	}
	.gr-form {
	background: white;
	border-radius: 10px;
	padding: 20px;
	box-shadow: 0 2px 10px rgba(0,0,0,0.1);
	}
	/* 移除 gr.Group 的默认灰色背景 */
	.gr-form {
	background: transparent !important;
	border: none !important;
	box-shadow: none !important;
	padding: 0 !important;
	}
	/* 固定3D可视化器尺寸（纯白卡片样式） */
	#viz_container {
	height: 650px !important;
	min-height: 650px !important;
	max-height: 650px !important;
	width: 100% !important;
	margin: 0 !important;
	padding: 12px !important;
	overflow: hidden !important;
	box-sizing: border-box !important;
	border-radius: 14px !important;
	border: 1px solid rgba(148, 163, 184, 0.6) !important;
	background: #ffffff !important;
	box-shadow: 0 10px 24px rgba(15, 23, 42, 0.12) !important;
	display: flex !important;
	align-items: center !important;
	justify-content: center !important;
	}
	/* 固定“左侧上传”视频组件高度（不要影响右侧结果视频） */
	#video_input {
	height: 300px !important;
	min-height: 300px !important;
	max-height: 300px !important;
	}
	#video_input video {
	height: 260px !important;
	max-height: 260px !important;
	object-fit: contain !important;
	background: #f8f9fa;
	}
	#video_input .gr-video-player {
	height: 260px !important;
	max-height: 260px !important;
	}

	/* 强力移除examples的灰色背景 - 使用更通用的选择器 */
	.horizontal-examples,
	.horizontal-examples > *,
	.horizontal-examples * {
	background: transparent !important;
	background-color: transparent !important;
	border: none !important;
	}

	/* Examples组件水平滚动样式 */
	.horizontal-examples [data-testid="examples"] {
	background: transparent !important;
	background-color: transparent !important;
	}

	.horizontal-examples [data-testid="examples"] > div {
	background: transparent !important;
	background-color: transparent !important;
	overflow-x: auto !important;
	overflow-y: hidden !important;
	scrollbar-width: thin;
	scrollbar-color: #667eea transparent;
	padding: 0 !important;
	margin-top: 10px;
	border: none !important;
	}

	.horizontal-examples [data-testid="examples"] table {
	display: flex !important;
	flex-wrap: nowrap !important;
	min-width: max-content !important;
	gap: 15px !important;
	padding: 10px 0;
	background: transparent !important;
	border: none !important;
	}

	.horizontal-examples [data-testid="examples"] tbody {
	display: flex !important;
	flex-direction: row !important;
	flex-wrap: nowrap !important;
	gap: 15px !important;
	background: transparent !important;
	}

	.horizontal-examples [data-testid="examples"] tr {
	display: flex !important;
	flex-direction: column !important;
	min-width: 160px !important;
	max-width: 160px !important;
	margin: 0 !important;
	background: white !important;
	border-radius: 12px;
	box-shadow: 0 3px 12px rgba(0,0,0,0.12);
	transition: all 0.3s ease;
	cursor: pointer;
	overflow: hidden;
	border: none !important;
	}

	.horizontal-examples [data-testid="examples"] tr:hover {
	transform: translateY(-4px);
	box-shadow: 0 8px 20px rgba(102, 126, 234, 0.25);
	}

	.horizontal-examples [data-testid="examples"] td {
	text-align: center !important;
	padding: 0 !important;
	border: none !important;
	background: transparent !important;
	}

	.horizontal-examples [data-testid="examples"] td:first-child {
	padding: 0 !important;
	background: transparent !important;
	}

	.horizontal-examples [data-testid="examples"] video {
	border-radius: 8px 8px 0 0 !important;
	width: 100% !important;
	height: 90px !important;
	object-fit: cover !important;
	background: #f8f9fa !important;
	}

	.horizontal-examples [data-testid="examples"] td:last-child {
	font-size: 11px !important;
	font-weight: 600 !important;
	color: #333 !important;
	padding: 8px 12px !important;
	background: linear-gradient(135deg, #f8f9ff 0%, #e6f3ff 100%) !important;
	border-radius: 0 0 8px 8px;
	}

	/* 滚动条样式 */
	.horizontal-examples [data-testid="examples"] > div::-webkit-scrollbar {
	height: 8px;
	}
	.horizontal-examples [data-testid="examples"] > div::-webkit-scrollbar-track {
	background: transparent;
	border-radius: 4px;
	}
	.horizontal-examples [data-testid="examples"] > div::-webkit-scrollbar-thumb {
	background: linear-gradient(135deg, #667eea 0%, #764ba2 100%);
	border-radius: 4px;
	}
	.horizontal-examples [data-testid="examples"] > div::-webkit-scrollbar-thumb:hover {
	background: linear-gradient(135deg, #5a6fd8 0%, #6a4190 100%);
	}
	"""
	) as demo:

	# Add prominent main title

	gr.Markdown("""
	# ✨ PEAR

	Welcome to [PEAR](https://wujh2001.github.io/PEAR/)! This interface allows you to human mesh from a single image.
	Please cite our paper and give us a star 🌟 if you find this project useful!

	⚡ Quick Start: Upload video → Click "Start Tracking Now!"

	🔬 Advanced Usage with PEAR:

	""")

	# Status indicator
	status_indicator = gr.Markdown("Reminder: 🟢 This app currently only supports single human-centered video inputs (up to 3 seconds). For other input types, users can customize the application manually. In addition, the model used here is not our final version (Used in our paper and project page); the complete model will be officially released in a few months.")

	# Main content area - video upload left, 3D visualization right
	with gr.Row():
	with gr.Column(scale=1):
	# Video upload section
	gr.Markdown("### 📂 Select Video")

	# Define video_input here so it can be referenced in examples
	video_input = gr.Video(
	label="Upload Video or Select Example",
	format="mp4",
	height=250, # Matched height with 3D viz
	elem_id="video_input"
	)


	# Traditional examples but with horizontal scroll styling
	gr.Markdown("🎨Examples: (scroll horizontally to see all videos)")
	with gr.Row(elem_classes=["horizontal-examples"]):
	# Horizontal video examples with slider
	# gr.HTML("<div style='margin-top: 5px;'></div>")
	gr.Examples(
	examples=[
	["example/example_1.mp4"],
	["example/example_2.mp4"],
	],
	inputs=[video_input],
	outputs=[video_input],
	fn=None,
	cache_examples=False,
	label="",
	examples_per_page=6 # Show 6 examples per page so they can wrap to multiple rows
	)

	with gr.Column(scale=2):
	# 3D Visualization - wider and taller to match left side
	with gr.Group():
	gr.Markdown("### ✨ Human Mesh Visualization")
	# Output-only video: no upload controls, only play the result
	viz_video = gr.Video(
	label="Reconstructed Human Mesh Video",
	height=650,
	elem_id="viz_container",
	interactive=False,
	autoplay=False,
	sources=None, # hide upload / webcam buttons
	)

	# Start button section - below video area
	with gr.Row():
	with gr.Column(scale=3):
	launch_btn = gr.Button("🚀 Start Tracking Now!", variant="primary", size="lg")
	with gr.Column(scale=1):
	clear_all_btn = gr.Button("🗑️ Clear All", variant="secondary", size="sm")

	# Downloads section - visible download area
	with gr.Row():
	with gr.Column():
	parameters_download = gr.File(
	label="📄 Download Mesh Results (vertices and faces)",
	interactive=False,
	)


	# GitHub Star Section
	gr.HTML("""
	<div style='background: linear-gradient(135deg, #e8eaff 0%, #f0f2ff 100%);
	border-radius: 8px; padding: 20px; margin: 15px 0;
	box-shadow: 0 2px 8px rgba(102, 126, 234, 0.1);
	border: 1px solid rgba(102, 126, 234, 0.15);'>
	<div style='text-align: center;'>
	<h3 style='color: #4a5568; margin: 0 0 10px 0; font-size: 18px; font-weight: 600;'>
	⭐ Love PEAR? Give us a Star! ⭐
	</h3>
	<p style='color: #666; margin: 0 0 15px 0; font-size: 14px; line-height: 1.5;'>
	Help us grow by starring our repository on GitHub! Your support means a lot to the community. 🚀
	</p>
	<a href="https://wujh2001.github.io/PEAR/" target="_blank"
	style='display: inline-flex; align-items: center; gap: 8px;
	background: rgba(102, 126, 234, 0.1); color: #4a5568;
	padding: 10px 20px; border-radius: 25px; text-decoration: none;
	font-weight: bold; font-size: 14px; border: 1px solid rgba(102, 126, 234, 0.2);
	transition: all 0.3s ease;'
	onmouseover="this.style.background='rgba(102, 126, 234, 0.15)'; this.style.transform='translateY(-2px)'"
	onmouseout="this.style.background='rgba(102, 126, 234, 0.1)'; this.style.transform='translateY(0)'">
	<span style='font-size: 16px;'>⭐</span>
	Star PEAR on GitHub
	</a>
	</div>
	</div>
	""")


	# Footer
	gr.HTML("""
	<div style='text-align: center; margin: 20px 0 10px 0;'>
	<span style='font-size: 12px; color: #888; font-style: italic;'>
	Powered by PEAR \| Built with ❤️ for the Computer Vision Community
	</span>
	</div>
	""")


	# Hidden state variables
	original_image_state = gr.State(None)



	# # Event handlers
	video_input.change(
	fn=handle_video_upload,
	inputs=[video_input],
	outputs=[original_image_state],
	api_name=False # ⭐ 关键
	)

	launch_btn.click(
	fn=launch_viz,
	inputs=[original_image_state],
	outputs=[viz_video, parameters_download],
	api_name=False # ⭐ 关键
	)


	# Launch the interface
	if __name__ == "__main__":
	print("🌟 Launching PEAR Local Version...")
	print("🔗 Running in Local Processing Mode")
	demo.queue().launch()