Spaces:

lucky0146
/

CodeFormer

Runtime error

App Files Files Community

lucky0146 committed on Mar 9, 2025

Commit

1a1e1ca

verified ·

1 Parent(s): 59aebcf

Create app.py

Browse files

Files changed (1) hide show

app.py +135 -0

app.py ADDED Viewed

	@@ -0,0 +1,135 @@

+import functools
+import os
+import sys
+import tarfile
+import urllib.request
+
+import cv2
+import gradio as gr
+import numpy as np
+import torch
+from PIL import Image
+def download_file(url, dest):
+    """Download ``url`` to the local path ``dest`` unless ``dest`` already exists.
+
+    The payload is written to ``dest + ".part"`` first and only renamed to
+    ``dest`` after the transfer finished, so an interrupted download is not
+    mistaken for a complete file the next time this function runs.
+
+    Args:
+        url: Address of the file to fetch.
+        dest: Target path; missing parent directories are created.
+
+    Raises:
+        Whatever ``urllib.request.urlretrieve`` or the file-system calls
+        raise; the temporary ``.part`` file is removed in that case.
+    """
+    if os.path.exists(dest):
+        return
+    parent = os.path.dirname(dest)
+    # A bare file name has no directory part and os.makedirs("") would raise.
+    if parent:
+        os.makedirs(parent, exist_ok=True)
+    partial = os.fspath(dest) + ".part"
+    try:
+        urllib.request.urlretrieve(url, partial)
+        os.replace(partial, dest)
+    finally:
+        # Still present only if the transfer or the rename failed.
+        if os.path.exists(partial):
+            os.remove(partial)
+    print(f"Downloaded {dest}")
+def setup_environment():
+    """Fetch the pretrained weight files used by the app into ``weights/``.
+
+    Each entry is handed to ``download_file`` in order: first the CodeFormer
+    checkpoint, then the facexlib RetinaFace detection model.
+    """
+    release_assets = (
+        # CodeFormer pretrained model
+        (
+            "https://github.com/sczhou/CodeFormer/releases/download/v0.1.0/codeformer.pth",
+            "weights/codeformer.pth",
+        ),
+        # facexlib detection model (needed for face detection)
+        (
+            "https://github.com/xinntao/facexlib/releases/download/v0.1.0/detection_Resnet50_Final.pth",
+            "weights/detection_Resnet50_Final.pth",
+        ),
+    )
+    for asset_url, local_path in release_assets:
+        download_file(asset_url, local_path)
+# Define a simplified CodeFormer architecture (instead of downloading codeformer_arch.py)
+class CodeFormer(torch.nn.Module):
+    """Mock stand-in for the CodeFormer network.
+
+    This is NOT the real architecture: it is a two-convolution encoder and a
+    single transposed-convolution decoder followed by a sigmoid. Real face
+    restoration requires the actual ``codeformer_arch.py``.
+
+    Args:
+        dim_embd: Number of feature channels between encoder and decoder.
+        codebook_size: Accepted for signature compatibility; unused here.
+        n_head: Accepted for signature compatibility; unused here.
+        n_layer: Accepted for signature compatibility; unused here.
+        connect_list: Accepted for signature compatibility; unused here.
+            An immutable tuple is used as default so the default object can
+            never be shared and mutated between instances.
+    """
+    def __init__(self, dim_embd=512, codebook_size=1024, n_head=8, n_layer=9, connect_list=('32', '64', '128', '256')):
+        super().__init__()
+        # Stride 1 and padding 1 with 3x3 kernels keep the spatial size unchanged.
+        self.encoder = torch.nn.Sequential(
+            torch.nn.Conv2d(3, dim_embd, kernel_size=3, stride=1, padding=1),
+            torch.nn.ReLU(),
+            torch.nn.Conv2d(dim_embd, dim_embd, kernel_size=3, stride=1, padding=1),
+        )
+        self.decoder = torch.nn.Sequential(
+            torch.nn.ConvTranspose2d(dim_embd, 3, kernel_size=3, stride=1, padding=1),
+            torch.nn.Sigmoid(),
+        )
+    def forward(self, x, w=0.5, adain=True):
+        """Run the placeholder encoder/decoder on ``x``.
+
+        ``w`` and ``adain`` are accepted so callers can use the same call
+        shape as for the real network, but they are ignored. Because of the
+        final sigmoid the returned values lie in [0, 1].
+        """
+        return self.decoder(self.encoder(x))
+# Load CodeFormer model
+@functools.lru_cache(maxsize=1)
+def load_codeformer():
+    """Build the CodeFormer module on CPU, load the checkpoint and return it.
+
+    The result is cached, so the weight files are fetched and the checkpoint
+    is read only on the first call; later calls return the same module
+    instance (already switched to eval mode).
+
+    Returns:
+        The ``CodeFormer`` module in eval mode on the CPU.
+    """
+    setup_environment()
+    model_path = "weights/codeformer.pth"
+    net = CodeFormer().to('cpu')
+    # NOTE(review): torch.load unpickles the file; only load checkpoints from
+    # a trusted source.
+    checkpoint = torch.load(model_path, map_location='cpu')
+    # The official inference script reads the weights from the "params_ema"
+    # entry of the checkpoint; unwrap it so the state dict itself is loaded.
+    if isinstance(checkpoint, dict):
+        for key in ("params_ema", "params"):
+            if isinstance(checkpoint.get(key), dict):
+                checkpoint = checkpoint[key]
+                break
+    # strict=False due to simplified architecture
+    result = net.load_state_dict(checkpoint, strict=False)
+    if len(result.missing_keys) == len(net.state_dict()):
+        # Make the otherwise silent mismatch visible in the Space logs.
+        print("Warning: no checkpoint weights matched the model; it runs with random weights")
+    net.eval()
+    return net
+# Image processing utilities (mimicking basicsr.utils)
+def img2tensor(img, bgr2rgb=True, float32=True):
+    """Convert an image array into a float tensor with the last axis moved first.
+
+    Args:
+        img: Array with three axes; the last one is moved to the front.
+        bgr2rgb: When true, the array is first passed through
+            ``cv2.cvtColor(..., cv2.COLOR_BGR2RGB)``.
+        float32: When true, the values are divided by 255.0.
+
+    Returns:
+        A ``torch`` float tensor.
+    """
+    pixels = cv2.cvtColor(img, cv2.COLOR_BGR2RGB) if bgr2rgb else img
+    channels_first = torch.from_numpy(pixels.transpose(2, 0, 1)).float()
+    if not float32:
+        return channels_first
+    return channels_first / 255.0
+def tensor2img(tensor, rgb2bgr=True, min_max=(-1, 1)):
+    """Convert a channels-first tensor into a ``uint8`` image array.
+
+    Values are clamped to ``min_max``, rescaled to [0, 255], rounded to the
+    nearest integer and returned with the channel axis last. The input
+    tensor is never modified.
+
+    Args:
+        tensor: Tensor of shape (C, H, W), or (1, C, H, W) with a single
+            batch entry.
+        rgb2bgr: When true, the result is passed through
+            ``cv2.cvtColor(..., cv2.COLOR_RGB2BGR)``.
+        min_max: ``(low, high)`` value range of ``tensor``.
+
+    Returns:
+        A ``numpy.uint8`` array of shape (H, W, C).
+    """
+    low, high = min_max
+    chw = tensor.detach().float().cpu()
+    # Drop only a leading batch axis of size one; a bare squeeze() would also
+    # collapse spatial axes of size one and break the transpose below.
+    if chw.dim() == 4 and chw.size(0) == 1:
+        chw = chw.squeeze(0)
+    # Out-of-place clamp: float()/cpu() may return the caller's own tensor,
+    # which an in-place clamp_ would silently overwrite.
+    chw = chw.clamp(low, high)
+    chw = (chw - low) / (high - low) * 255.0
+    # Round before the integer cast; astype alone truncates toward zero.
+    img = chw.round().numpy().transpose(1, 2, 0).astype(np.uint8)
+    if rgb2bgr:
+        img = cv2.cvtColor(img, cv2.COLOR_RGB2BGR)
+    return img
+# Inference function
+def enhance_image(image, fidelity_weight=0.5):
+    """Detect the faces in ``image``, run each through the model and paste them back.
+
+    Args:
+        image: PIL image delivered by the Gradio input component, or ``None``
+            when nothing was uploaded.
+        fidelity_weight: Forwarded to the network as ``w``.
+
+    Returns:
+        A PIL image with the processed faces pasted into the input image.
+
+    Raises:
+        gr.Error: If no image was provided.
+    """
+    from facexlib.utils.face_restoration_helper import FaceRestoreHelper
+    if image is None:
+        raise gr.Error("Please upload an image first.")
+    # Load model
+    net = load_codeformer()
+    # Convert PIL image to OpenCV format. Forcing three channels first keeps
+    # RGBA and greyscale uploads from failing in the RGB->BGR conversion.
+    img = cv2.cvtColor(np.array(image.convert("RGB")), cv2.COLOR_RGB2BGR)
+    # Initialize face helper
+    face_helper = FaceRestoreHelper(upscale_factor=1, face_size=512, crop_ratio=(1, 1), det_model='retinaface_resnet50', save_ext='png', device='cpu')
+    face_helper.clean_all()
+    face_helper.read_image(img)
+    # facexlib's get_face_landmarks_5 takes no ``align`` keyword; passing one
+    # raises TypeError. Alignment is done by align_warp_face() below.
+    face_helper.get_face_landmarks_5()
+    face_helper.align_warp_face()
+    # Enhance face with CodeFormer
+    for cropped_face in face_helper.cropped_faces:
+        cropped_face_t = img2tensor(cropped_face, bgr2rgb=True, float32=True)
+        # Map [0, 1] to [-1, 1] so the input range matches the (-1, 1) range
+        # the output is decoded with, as in the official inference script.
+        cropped_face_t = (cropped_face_t - 0.5) / 0.5
+        with torch.no_grad():
+            output = net(cropped_face_t.unsqueeze(0), w=fidelity_weight, adain=True)[0]
+        restored_face = tensor2img(output, rgb2bgr=True, min_max=(-1, 1))
+        restored_face = restored_face.astype('uint8')
+        face_helper.add_restored_face(restored_face)
+    # Get final restored image
+    face_helper.get_inverse_affine(None)
+    restored_img = face_helper.paste_faces_to_input_image()
+    # Convert back to PIL for Gradio
+    restored_img = cv2.cvtColor(restored_img, cv2.COLOR_BGR2RGB)
+    return Image.fromarray(restored_img)
+# Gradio interface.
+# Components are created inside the Blocks context in display order, so the
+# statement order below must be kept: title, description, the image row,
+# the slider and finally the button.
+with gr.Blocks() as demo:
+    gr.Markdown("# CodeFormer Face Restoration (CPU)")
+    gr.Markdown("Upload an image to enhance faces using CodeFormer. Runs on CPU in Hugging Face Spaces.")
+    # Input and output images share one row.
+    with gr.Row():
+        input_image = gr.Image(type="pil", label="Input Image")
+        output_image = gr.Image(type="pil", label="Enhanced Image")
+    # Slider value is passed to enhance_image as fidelity_weight.
+    fidelity_slider = gr.Slider(0, 1, value=0.5, step=0.1, label="Fidelity Weight (0 = more restoration, 1 = more original)")
+    submit_btn = gr.Button("Enhance")
+    # Clicking the button calls enhance_image(image, fidelity_weight) and
+    # shows the returned image in the output component.
+    submit_btn.click(
+        fn=enhance_image,
+        inputs=[input_image, fidelity_slider],
+        outputs=output_image
+    )
+# Script entry point: only runs when the file is executed directly.
+if __name__ == "__main__":
+    # Fetch the weight files before the UI starts; download_file skips files
+    # that already exist, so repeating this call later is harmless.
+    setup_environment()
+    demo.launch()