Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
|
@@ -11,15 +11,12 @@ from realesrgan.archs.srvgg_arch import SRVGGNetCompact
|
|
| 11 |
from gfpgan import GFPGANer
|
| 12 |
from basicsr.utils.download_util import load_file_from_url
|
| 13 |
|
| 14 |
-
# --- Model Loading ---
|
| 15 |
-
# We create a dictionary to cache models so they are only loaded once.
|
| 16 |
model_cache = {}
|
| 17 |
|
| 18 |
def get_upsampler(model_name='realesr-general-x4v3'):
|
| 19 |
-
"""Loads and returns the specified RealESRGAN model."""
|
| 20 |
if model_name in model_cache:
|
| 21 |
return model_cache[model_name]
|
| 22 |
-
|
| 23 |
if model_name == 'RealESRGAN_x4plus_anime_6B':
|
| 24 |
model = RRDBNet(num_in_ch=3, num_out_ch=3, num_feat=64, num_block=6, num_grow_ch=32, scale=4)
|
| 25 |
netscale = 4
|
|
@@ -28,22 +25,18 @@ def get_upsampler(model_name='realesr-general-x4v3'):
|
|
| 28 |
model = SRVGGNetCompact(num_in_ch=3, num_out_ch=3, num_feat=64, num_conv=32, upscale=4, act_type='prelu')
|
| 29 |
netscale = 4
|
| 30 |
file_url = 'https://github.com/xinntao/Real-ESRGAN/releases/download/v0.2.5.0/realesr-general-x4v3.pth'
|
| 31 |
-
|
| 32 |
model_path = load_file_from_url(url=file_url, model_dir='weights', progress=True)
|
| 33 |
-
|
| 34 |
upsampler = RealESRGANer(
|
| 35 |
scale=netscale, model_path=model_path, model=model,
|
| 36 |
-
tile=64, tile_pad=10, pre_pad=10, half=True, gpu_id=None
|
| 37 |
)
|
| 38 |
model_cache[model_name] = upsampler
|
| 39 |
return upsampler
|
| 40 |
|
| 41 |
def get_face_enhancer(upsampler, outscale):
|
| 42 |
-
"""Loads and returns the GFPGAN face enhancer."""
|
| 43 |
key = f'face_enhancer_{outscale}'
|
| 44 |
if key in model_cache:
|
| 45 |
return model_cache[key]
|
| 46 |
-
|
| 47 |
face_enhancer = GFPGANer(
|
| 48 |
model_path='https://github.com/TencentARC/GFPGAN/releases/download/v1.3.0/GFPGANv1.3.pth',
|
| 49 |
upscale=outscale, arch='clean', channel_multiplier=2, bg_upsampler=upsampler
|
|
@@ -51,102 +44,76 @@ def get_face_enhancer(upsampler, outscale):
|
|
| 51 |
model_cache[key] = face_enhancer
|
| 52 |
return face_enhancer
|
| 53 |
|
| 54 |
-
# --- Core Video Processing Function ---
|
| 55 |
def enhance_video(video_path, model_name, outscale, face_enhance, progress=gr.Progress(track_tqdm=True)):
|
| 56 |
-
"""Enhances a video frame by frame and provides progress updates."""
|
| 57 |
if not video_path:
|
| 58 |
raise gr.Error("Please upload a video to enhance.")
|
| 59 |
-
|
| 60 |
try:
|
| 61 |
upsampler = get_upsampler(model_name)
|
| 62 |
-
|
| 63 |
face_enhancer = None
|
| 64 |
if face_enhance:
|
| 65 |
face_enhancer = get_face_enhancer(upsampler, outscale)
|
| 66 |
-
|
| 67 |
cap = cv2.VideoCapture(video_path)
|
| 68 |
-
fps = cap.get(
|
| 69 |
-
width = int(cap.get(
|
| 70 |
-
height = int(cap.get(
|
| 71 |
-
total_frames = int(cap.get(
|
| 72 |
-
|
| 73 |
-
# Prepare output video writer
|
| 74 |
temp_dir = tempfile.mkdtemp()
|
| 75 |
enhanced_video_path = os.path.join(temp_dir, "enhanced_video.mp4")
|
| 76 |
fourcc = cv2.VideoWriter_fourcc(*'mp4v')
|
| 77 |
writer = cv2.VideoWriter(enhanced_video_path, fourcc, fps, (width * outscale, height * outscale))
|
| 78 |
-
|
| 79 |
-
# Process each frame
|
| 80 |
for _ in progress.tqdm(range(total_frames), desc="Enhancing Frames..."):
|
| 81 |
ret, frame = cap.read()
|
| 82 |
-
if not ret:
|
| 83 |
-
break
|
| 84 |
-
|
| 85 |
if face_enhancer:
|
| 86 |
_, _, enhanced_frame = face_enhancer.enhance(frame, has_aligned=False, only_center_face=False, paste_back=True)
|
| 87 |
else:
|
| 88 |
enhanced_frame, _ = upsampler.enhance(frame, outscale=outscale)
|
| 89 |
-
|
| 90 |
writer.write(enhanced_frame)
|
| 91 |
-
|
| 92 |
cap.release()
|
| 93 |
writer.release()
|
| 94 |
-
|
| 95 |
-
# Merge audio back into the enhanced video
|
| 96 |
final_output_path = os.path.join(temp_dir, "final_output_with_audio.mp4")
|
| 97 |
audio_merge_cmd = f'ffmpeg -y -i "{enhanced_video_path}" -i "{video_path}" -c:v libx264 -crf 23 -preset fast -c:a aac -b:a 128k -map 0:v:0 -map 1:a:0 -shortest "{final_output_path}"'
|
| 98 |
subprocess.call(audio_merge_cmd, shell=True, stderr=subprocess.DEVNULL, stdout=subprocess.DEVNULL)
|
| 99 |
-
|
| 100 |
return final_output_path
|
| 101 |
-
|
| 102 |
except Exception as e:
|
| 103 |
print(traceback.format_exc())
|
| 104 |
raise gr.Error(f"An error occurred: {e}")
|
| 105 |
|
| 106 |
-
# --- Gradio UI with
|
| 107 |
with gr.Blocks(theme=gr.themes.Soft(primary_hue="violet"), title="π₯ AI Video Enhancer") as demo:
|
| 108 |
gr.Markdown(
|
| 109 |
"""
|
| 110 |
-
|
| 111 |
-
Improve video quality, upscale resolution, and restore faces with cutting-edge AI.
|
| 112 |
-
**Note:** Processing can be slow, especially for longer videos.
|
| 113 |
"""
|
| 114 |
)
|
| 115 |
-
|
| 116 |
-
#
|
| 117 |
-
with gr.Row():
|
| 118 |
-
|
| 119 |
-
|
| 120 |
-
|
| 121 |
-
|
| 122 |
-
|
| 123 |
-
|
| 124 |
-
# Left side for main settings
|
| 125 |
-
with gr.Column(scale=3):
|
| 126 |
model_name = gr.Dropdown(
|
| 127 |
choices=["realesr-general-x4v3", "RealESRGAN_x4plus_anime_6B"],
|
| 128 |
value="realesr-general-x4v3",
|
| 129 |
label="Model Type (General or Anime)"
|
| 130 |
)
|
| 131 |
outscale = gr.Slider(1, 4, value=2, step=1, label="Upscale Factor")
|
|
|
|
|
|
|
|
|
|
|
|
|
| 132 |
|
| 133 |
-
#
|
| 134 |
-
|
| 135 |
-
|
| 136 |
-
|
| 137 |
-
|
| 138 |
-
# Examples and Download components
|
| 139 |
-
gr.Examples(
|
| 140 |
-
examples=["sample_video.mp4"], # Add path to your example video
|
| 141 |
-
inputs=[video_input],
|
| 142 |
-
label="Click an example to start"
|
| 143 |
-
)
|
| 144 |
-
download_file = gr.File(label="β¬οΈ Download Enhanced Video", visible=False)
|
| 145 |
|
| 146 |
-
# --- Event Logic ---
|
| 147 |
def on_submit(video, model, scale, face):
|
| 148 |
-
# When the button is clicked, start the enhancement and return the path to the output video.
|
| 149 |
-
# Also, make the download button visible.
|
| 150 |
output_path = enhance_video(video, model, scale, face)
|
| 151 |
return output_path, gr.update(value=output_path, visible=True)
|
| 152 |
|
|
|
|
| 11 |
from gfpgan import GFPGANer
|
| 12 |
from basicsr.utils.download_util import load_file_from_url
|
| 13 |
|
| 14 |
+
# --- Model Loading (Unchanged) ---
|
|
|
|
| 15 |
# Module-level cache mapping a model key (model name, or "face_enhancer_<scale>")
# to its loaded instance, so each model is constructed at most once per process.
model_cache = {}
|
| 16 |
|
| 17 |
def get_upsampler(model_name='realesr-general-x4v3'):
    """Load (or fetch from cache) the RealESRGAN upsampler for *model_name*.

    Supported names:
      - 'RealESRGAN_x4plus_anime_6B': RRDBNet variant tuned for anime content.
      - 'realesr-general-x4v3' (default): compact general-purpose SRVGG model.

    Weights are downloaded into ./weights on first use; the constructed
    RealESRGANer is memoised in ``model_cache`` so it is built only once.
    """
    if model_name in model_cache:
        return model_cache[model_name]

    if model_name == 'RealESRGAN_x4plus_anime_6B':
        model = RRDBNet(num_in_ch=3, num_out_ch=3, num_feat=64, num_block=6, num_grow_ch=32, scale=4)
        netscale = 4
        # NOTE(review): this URL is reconstructed from the upstream Real-ESRGAN
        # release assets — the original line is not visible in this view; confirm.
        file_url = 'https://github.com/xinntao/Real-ESRGAN/releases/download/v0.2.2.4/RealESRGAN_x4plus_anime_6B.pth'
    else:
        model = SRVGGNetCompact(num_in_ch=3, num_out_ch=3, num_feat=64, num_conv=32, upscale=4, act_type='prelu')
        netscale = 4
        file_url = 'https://github.com/xinntao/Real-ESRGAN/releases/download/v0.2.5.0/realesr-general-x4v3.pth'

    model_path = load_file_from_url(url=file_url, model_dir='weights', progress=True)

    # FIX: half-precision inference is only valid on CUDA devices; the original
    # hard-coded half=True, which fails on CPU-only hosts (fp16 conv is not
    # supported on CPU). Gate it on CUDA availability instead.
    import torch
    use_half = torch.cuda.is_available()

    upsampler = RealESRGANer(
        scale=netscale, model_path=model_path, model=model,
        tile=64, tile_pad=10, pre_pad=10, half=use_half, gpu_id=None
    )
    model_cache[model_name] = upsampler
    return upsampler
|
| 35 |
|
| 36 |
def get_face_enhancer(upsampler, outscale):
    """Return a cached GFPGAN face enhancer configured for *outscale*.

    A separate instance is kept per upscale factor; *upsampler* is used as
    the background upsampler for non-face regions.
    """
    cache_key = f'face_enhancer_{outscale}'
    cached = model_cache.get(cache_key)
    if cached is not None:
        return cached

    enhancer = GFPGANer(
        model_path='https://github.com/TencentARC/GFPGAN/releases/download/v1.3.0/GFPGANv1.3.pth',
        upscale=outscale,
        arch='clean',
        channel_multiplier=2,
        bg_upsampler=upsampler,
    )
    model_cache[cache_key] = enhancer
    return enhancer
|
| 46 |
|
| 47 |
+
# --- Core Video Processing Function (Unchanged) ---
|
| 48 |
def enhance_video(video_path, model_name, outscale, face_enhance, progress=gr.Progress(track_tqdm=True)):
    """Enhance a video frame by frame with RealESRGAN (optionally + GFPGAN).

    Args:
        video_path: Path to the input video; a gr.Error is raised if falsy.
        model_name: Model key understood by get_upsampler().
        outscale: Integer upscale factor applied to frame width/height.
        face_enhance: When True, run GFPGAN face restoration on each frame.
        progress: Gradio progress tracker driving the tqdm loop below.

    Returns:
        Path to the enhanced video with the source audio merged back in,
        or the video-only result when the audio merge fails.

    Raises:
        gr.Error: On missing input or any processing failure (original
        traceback is printed to the server log).
    """
    if not video_path:
        raise gr.Error("Please upload a video to enhance.")

    try:
        upsampler = get_upsampler(model_name)

        face_enhancer = None
        if face_enhance:
            face_enhancer = get_face_enhancer(upsampler, outscale)

        cap = cv2.VideoCapture(video_path)
        fps = cap.get(cv2.CAP_PROP_FPS)
        width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
        height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
        total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))

        # Prepare the output writer in a fresh temp directory.
        temp_dir = tempfile.mkdtemp()
        enhanced_video_path = os.path.join(temp_dir, "enhanced_video.mp4")
        fourcc = cv2.VideoWriter_fourcc(*'mp4v')
        writer = cv2.VideoWriter(enhanced_video_path, fourcc, fps, (width * outscale, height * outscale))

        for _ in progress.tqdm(range(total_frames), desc="Enhancing Frames..."):
            ret, frame = cap.read()
            if not ret:
                break

            if face_enhancer:
                _, _, enhanced_frame = face_enhancer.enhance(frame, has_aligned=False, only_center_face=False, paste_back=True)
            else:
                enhanced_frame, _ = upsampler.enhance(frame, outscale=outscale)

            writer.write(enhanced_frame)

        cap.release()
        writer.release()

        # Merge the original audio track back into the enhanced video.
        # FIX: use an argument list with shell=False instead of an f-string
        # with shell=True — the original was vulnerable to shell injection
        # via crafted file names and fragile around quoting.
        final_output_path = os.path.join(temp_dir, "final_output_with_audio.mp4")
        audio_merge_cmd = [
            'ffmpeg', '-y',
            '-i', enhanced_video_path,
            '-i', video_path,
            '-c:v', 'libx264', '-crf', '23', '-preset', 'fast',
            '-c:a', 'aac', '-b:a', '128k',
            '-map', '0:v:0', '-map', '1:a:0',
            '-shortest', final_output_path,
        ]
        returncode = subprocess.call(audio_merge_cmd, stderr=subprocess.DEVNULL, stdout=subprocess.DEVNULL)

        # FIX: if ffmpeg failed (e.g. the source has no audio stream), fall
        # back to the video-only file instead of returning a missing path.
        if returncode != 0 or not os.path.exists(final_output_path):
            return enhanced_video_path

        return final_output_path
    except Exception as e:
        print(traceback.format_exc())
        raise gr.Error(f"An error occurred: {e}")
|
| 82 |
|
| 83 |
+
# --- Gradio UI with Corrected Layout ---
|
| 84 |
with gr.Blocks(theme=gr.themes.Soft(primary_hue="violet"), title="π₯ AI Video Enhancer") as demo:
|
| 85 |
gr.Markdown(
|
| 86 |
"""
|
| 87 |
+
Improve video quality, upscale resolution, and restore faces with cutting-edge AI.
|
|
|
|
|
|
|
| 88 |
"""
|
| 89 |
)
|
| 90 |
+
|
| 91 |
+
# Main two-column layout
|
| 92 |
+
with gr.Row(variant="panel"):
|
| 93 |
+
# --- Input Column on the Left ---
|
| 94 |
+
with gr.Column(scale=1):
|
| 95 |
+
video_input = gr.Video(label="π¬ Upload Your Video")
|
| 96 |
+
|
| 97 |
+
# Accordion for less frequently used settings
|
| 98 |
+
with gr.Accordion("Advanced Options", open=False):
|
|
|
|
|
|
|
| 99 |
model_name = gr.Dropdown(
|
| 100 |
choices=["realesr-general-x4v3", "RealESRGAN_x4plus_anime_6B"],
|
| 101 |
value="realesr-general-x4v3",
|
| 102 |
label="Model Type (General or Anime)"
|
| 103 |
)
|
| 104 |
outscale = gr.Slider(1, 4, value=2, step=1, label="Upscale Factor")
|
| 105 |
+
|
| 106 |
+
# --- Output Column on the Right ---
|
| 107 |
+
with gr.Column(scale=1):
|
| 108 |
+
video_output = gr.Video(label="π Enhanced Result")
|
| 109 |
|
| 110 |
+
# β
FIX: Controls are now placed directly under the output video
|
| 111 |
+
face_enhance = gr.Checkbox(label="β¨ Restore Faces (GFPGAN)", value=False, elem_id="face-enhance-checkbox")
|
| 112 |
+
enhance_btn = gr.Button("π Enhance Video", variant="primary")
|
| 113 |
+
download_file = gr.File(label="β¬οΈ Download Enhanced Video", visible=False)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 114 |
|
| 115 |
+
# --- Event Logic (Unchanged) ---
|
| 116 |
def on_submit(video, model, scale, face):
    """Run enhancement, then reveal the download component with the result."""
    result_path = enhance_video(video, model, scale, face)
    return result_path, gr.update(value=result_path, visible=True)
|
| 119 |
|