Spaces:

lucky0146
/

CodeFormer

Runtime error

App Files Files Community

lucky0146 commited on Apr 5, 2025

Commit

ba71866

verified ·

1 Parent(s): d4e25e7

Update app.py

Browse files

Files changed (1) hide show

app.py +170 -131

app.py CHANGED Viewed

@@ -1,137 +1,176 @@
-import os
-import sys
 import gradio as gr
 import torch
 import cv2
 import numpy as np
-from PIL import Image
-import urllib.request
-from facexlib.utils.face_restoration_helper import FaceRestoreHelper
-from codeformer_arch import CodeFormer
-# Function to download a file from a URL
-def download_file(url, dest):
-    if not os.path.exists(dest):
-        os.makedirs(os.path.dirname(dest), exist_ok=True)
-        urllib.request.urlretrieve(url, dest)
-        print(f"Downloaded {dest}")
-# Download pretrained models
-def setup_environment():
-    # Download CodeFormer pretrained model
-    model_url = "https://github.com/sczhou/CodeFormer/releases/download/v0.1.0/codeformer.pth"
-    model_path = "weights/CodeFormer/codeformer.pth"
-    download_file(model_url, model_path)
-    # Download facelib model (for face detection)
-    facelib_url = "https://github.com/xinntao/facexlib/releases/download/v0.1.0/detection_Resnet50_Final.pth"
-    facelib_path = "weights/facelib/detection_Resnet50_Final.pth"
-    download_file(facelib_url, facelib_path)
-    # Download Real-ESRGAN model for background upsampling (optional)
-    realesrgan_url = "https://github.com/xinntao/Real-ESRGAN/releases/download/v0.1.0/RealESRGAN_x4plus.pth"
-    realesrgan_path = "weights/realesrgan/RealESRGAN_x4plus.pth"
-    download_file(realesrgan_url, realesrgan_path)
-# Load CodeFormer model
-def load_codeformer():
-    setup_environment()
-    model = CodeFormer(dim_embd=512, codebook_size=1024, n_head=8, n_layers=9, connect_list=['32', '64', '128', '256'])
-    # Load the state dict, extracting the 'params_ema' key
-    checkpoint = torch.load("weights/CodeFormer/codeformer.pth", map_location='cpu')
-    state_dict = checkpoint['params_ema'] if 'params_ema' in checkpoint else checkpoint
-    model.load_state_dict(state_dict, strict=False)  # Use strict=False to ignore missing keys
-    model.eval()
-    model = model.to('cpu')  # Force CPU
-    return model
-# Image processing utilities (mimicking basicsr.utils)
-def img2tensor(img, bgr2rgb=True, float32=True):
-    if bgr2rgb:
-        img = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
-    img = torch.from_numpy(img.transpose(2, 0, 1)).float()
-    if float32:
-        img = img / 255.0
-    return img
-def tensor2img(tensor, rgb2bgr=True, min_max=(-1, 1)):
-    tensor = tensor.squeeze().float().cpu().clamp_(*min_max)
-    tensor = (tensor - min_max[0]) / (min_max[1] - min_max[0]) * 255.0
-    img = tensor.numpy().transpose(1, 2, 0).astype(np.uint8)
-    if rgb2bgr:
-        img = cv2.cvtColor(img, cv2.COLOR_RGB2BGR)
-    return img
-# Inference function
-def enhance_image(input_image, fidelity_weight=0.5, background_enhance=True, face_upsample=False):
-    # Convert PIL image to OpenCV format
-    img = np.array(input_image)
-    img = cv2.cvtColor(img, cv2.COLOR_RGB2BGR)
-    # Initialize face helper
-    face_helper = FaceRestoreHelper(
-        upscale_factor=1 if not face_upsample else 2,
-        face_size=512,
-        crop_ratio=(1, 1),
-        det_model='retinaface_resnet50',
-        save_ext='png',
-        device='cpu'
-    )
-    face_helper.clean_all()
-    face_helper.read_image(img)
-    face_helper.get_face_landmarks_5()
-    face_helper.align_warp_face()
-    # Load CodeFormer model
-    net = load_codeformer()
-    # Enhance face
-    for cropped_face in face_helper.cropped_faces:
-        cropped_face_t = img2tensor(cropped_face, bgr2rgb=True, float32=True)
         with torch.no_grad():
-            output = net(cropped_face_t.unsqueeze(0), w=fidelity_weight, adain=True)[0]
-        restored_face = tensor2img(output, rgb2bgr=True, min_max=(-1, 1))
-        restored_face = restored_face.astype('uint8')
-        face_helper.add_restored_face(restored_face)
-    # Get restored image
-    face_helper.get_inverse_affine(None)
-    restored_img = face_helper.paste_faces_to_input_image()
-    # Background enhancement with Real-ESRGAN (optional)
-    if background_enhance:
-        from realesrgan import RealESRGANer
-        upsampler = RealESRGANer(
-            scale=4,
-            model_path="weights/realesrgan/RealESRGAN_x4plus.pth",
-            device='cpu'
-        )
-        restored_img, _ = upsampler.enhance(restored_img, outscale=4)
-    # Convert back to PIL for Gradio
-    restored_img = cv2.cvtColor(restored_img, cv2.COLOR_BGR2RGB)
-    return Image.fromarray(restored_img)
-# Gradio interface
-with gr.Blocks() as demo:
-    gr.Markdown("# CodeFormer Face Restoration (CPU)")
-    gr.Markdown("Upload an image to enhance faces using CodeFormer. Runs on CPU in Hugging Face Spaces.")
-    with gr.Row():
-        input_image = gr.Image(type="pil", label="Input Image")
-        output_image = gr.Image(type="pil", label="Enhanced Image")
-    fidelity_slider = gr.Slider(0, 1, value=0.5, step=0.01, label="Fidelity Weight (0 = more restoration, 1 = more original)")
-    background_enhance = gr.Checkbox(label="Enhance Background (Real-ESRGAN)", value=True)
-    face_upsample = gr.Checkbox(label="Upsample Restored Faces", value=False)
-    submit_btn = gr.Button("Enhance")
-    submit_btn.click(
-        fn=enhance_image,
-        inputs=[input_image, fidelity_slider, background_enhance, face_upsample],
-        outputs=output_image
-    )
 if __name__ == "__main__":
-    setup_environment()
-    demo.launch()

 import gradio as gr
 import torch
 import cv2
 import numpy as np
+import os
+import time
+import warnings
+# Suppress specific warnings or all warnings if needed
+warnings.filterwarnings("ignore")
+# Try importing CodeFormer, handle potential import errors
+try:
+    from codeformer import CodeFormer
+except ImportError:
+    print("Error: CodeFormer not found. Make sure it's installed correctly (check requirements.txt).")
+    # Optionally, try adding the repo path if cloned (more complex setup)
+    # sys.path.append('CodeFormer') # If you cloned the repo into a folder named CodeFormer
+    # from basicsr.utils.registry import ARCH_REGISTRY
+    raise
+print("Imports successful.")
+# --- Configuration ---
+# Automatically select CPU
+device = torch.device("cpu")
+print(f"Using device: {device}")
+# Initialize CodeFormer - Model weights will be downloaded automatically on first run
+# Ensure you have internet access in the Space for the download.
+print("Initializing CodeFormer model...")
+try:
+    # Adjust model path if needed, but pretrained=True should handle downloads
+    # Check the documentation for the 'codeformer' package if this fails.
+    # Common parameters: bg_upsampler='realesrgan', face_upsample=True
+    codeformer_net = CodeFormer(
+        dim_embd=512,
+        codebook_size=1024,
+        n_head=8,
+        n_layers=9,
+        connect_list=['32', '64', '128', '256']
+    ).to(device)
+    # Load the pre-trained model weights
+    # Adjust the path based on how the package stores weights or if downloaded manually
+    # This path assumes the standard download location used by `load_state_dict_from_url`
+    # It might differ based on the specific 'codeformer' pip package version.
+    # If this fails, check where the package downloads/expects the .pth file.
+    model_path = 'weights/CodeFormer/codeformer.pth' # Default path often used
+    # Check if the default path exists, otherwise rely on package's internal loading if possible
+    # A robust package might have a load_pretrained() method. Check its usage.
+    # This explicit loading might be needed if the package is minimal.
+    # Let's assume the package handles loading implicitly or requires a different call.
+    # Simpler approach: Rely on package potentially loading during init or a specific method.
+    # If the above CodeFormer() init doesn't load weights, check package docs.
+    # For now, let's assume the package *might* need explicit loading IF NOT BUILT-IN:
+    # Placeholder checkpoint loading - adjust based on actual package behavior
+    # This might be automatically handled by the package; if the app fails here,
+    # investigate how the specific `codeformer` pip package loads weights.
+    try:
+        # Example: Load weights/CodeFormer/codeformer.pth
+        # This path needs to be correct relative to where HF downloads/caches it, or package internal path
+        # It's often complex to pinpoint the exact cache location in HF Spaces
+        # A safer bet is often using a model hub integration if available, or ensuring the package handles it well.
+        # For now, we'll *assume* the package loads weights correctly or fails gracefully if not found
+        # checkpoint = torch.load(model_path)['params_ema']
+        # codeformer_net.load_state_dict(checkpoint)
+        print("Model weights assumed to be loaded by package or implicitly.") # Placeholder message
+    except FileNotFoundError:
+         print(f"Warning: Pretrained weights not found at default path '{model_path}'. Relying on package's internal loading mechanism if available.")
+    except Exception as e:
+         print(f"Error loading weights explicitly: {e}. Relying on package's internal loading.")
+    codeformer_net.eval()
+    print("CodeFormer model initialized successfully.")
+except Exception as e:
+    print(f"Error initializing CodeFormer model: {e}")
+    # Provide helpful error message in the UI if initialization fails
+    gr.Error(f"Failed to load CodeFormer model. Check logs. Error: {e}")
+    codeformer_net = None # Set to None to prevent processing attempts
+# --- Processing Function ---
+def enhance_image(input_img, fidelity_weight, background_enhance, face_upsample):
+    """
+    Enhances the input image using CodeFormer.
+    Args:
+        input_img (np.ndarray): Input image from Gradio (RGB format).
+        fidelity_weight (float): Balances fidelity and quality (0 = best quality, 1 = best fidelity).
+        background_enhance (bool): Whether to enhance background using RealESRGAN.
+        face_upsample (bool): Whether to further upsample restored faces.
+    Returns:
+        np.ndarray: Enhanced image (RGB format).
+        str: Processing time message.
+    """
+    if codeformer_net is None:
+        return None, "Error: CodeFormer model not loaded."
+    if input_img is None:
+        return None, "Error: No input image provided."
+    print(f"Processing image with fidelity: {fidelity_weight}, bg_enhance: {background_enhance}, face_upsample: {face_upsample}")
+    start_time = time.time()
+    try:
+        # Gradio provides RGB, CodeFormer often expects BGR internally via OpenCV
+        img_bgr = cv2.cvtColor(input_img, cv2.COLOR_RGB2BGR)
+        # Enhance the image - Use the correct method from the CodeFormer package
+        # The method might be called 'enhance', 'process', 'restore', etc.
+        # Check the package documentation for the exact API.
+        # Assuming a method like `codeformer_net.enhance(...)` or similar exists:
+        # The exact parameters (like `w`, `adain`) depend on the CodeFormer implementation.
+        # `w` typically corresponds to fidelity_weight.
         with torch.no_grad():
+            output_bgr, _, _ = codeformer_net.enhance(
+                img_bgr,
+                w=fidelity_weight,
+                adain=True, # Adain usually enabled
+                face_upsample=face_upsample,
+                bg_upsampler='realesrgan' if background_enhance else None # Use bg_upsampler if requested
+            )
+        # Convert back to RGB for Gradio display
+        output_rgb = cv2.cvtColor(output_bgr, cv2.COLOR_BGR2RGB)
+        end_time = time.time()
+        processing_time = end_time - start_time
+        time_msg = f"Processing finished in {processing_time:.2f} seconds (on CPU)."
+        print(time_msg)
+        return output_rgb, time_msg
+    except Exception as e:
+        print(f"Error during enhancement: {e}")
+        import traceback
+        traceback.print_exc()
+        return None, f"Error during processing: {e}"
+# --- Gradio Interface ---
+title = "CodeFormer Image Enhancement (CPU Demo)"
+description = """
+Upload an image to enhance its quality, particularly for faces, using CodeFormer.
+**Note:** This demo runs on a free Hugging Face CPU. Processing will be **SLOW** (expect seconds to minutes per image).
+Adjust the fidelity weight (0 = max quality enhancement, 1 = closer to original). Optionally enhance background and upsample faces.
+"""
+article = "<p style='text-align: center'>CodeFormer CPU Demo | <a href='https://github.com/sczhou/CodeFormer' target='_blank'>Official Repo</a></p>"
+iface = gr.Interface(
+    fn=enhance_image,
+    inputs=[
+        gr.Image(label="Upload Image", type="numpy"),
+        gr.Slider(minimum=0.0, maximum=1.0, step=0.05, value=0.7, label="Fidelity Weight (0 = Max Quality, 1 = Max Fidelity)"),
+        gr.Checkbox(label="Enhance Background (Uses RealESRGAN)", value=True),
+        gr.Checkbox(label="Upsample Restored Faces", value=True)
+    ],
+    outputs=[
+        gr.Image(label="Enhanced Image", type="numpy"),
+        gr.Textbox(label="Processing Time")
+    ],
+    title=title,
+    description=description,
+    article=article,
+    examples=[
+        ["examples/face1.png", 0.7, True, True], # Add example files to an 'examples' folder in your Space
+        ["examples/face2.png", 0.5, True, True],
+        ["examples/bg1.png", 0.8, True, False],
+    ],
+    allow_flagging="never" # Can change to "manual" or "auto" if needed
+)
+# --- Launch the App ---
 if __name__ == "__main__":
+    iface.launch()
+    print("Gradio app launched.")