Spaces:

ParamDev
/

spectraGAN

Running

File size: 10,573 Bytes

54d2540

"""
export_models.py
----------------
Downloads publicly available pretrained weights for SRCNN and EDSR (HResNet-style)
and exports them as ONNX files into the ./model/ directory.

Run once before starting app.py:
    pip install torch torchvision huggingface_hub basicsr
    python export_models.py

After this script finishes you should have:
    model/SRCNN_x4.onnx
    model/HResNet_x4.onnx

Then upload both files to Google Drive, copy the file IDs into DRIVE_IDS in app.py,
OR set LOCAL_ONLY = True below to skip Drive entirely and load straight from disk.
"""

import os
import torch
import torch.nn as nn
import torch.onnx
from pathlib import Path

MODEL_DIR = Path("model")
MODEL_DIR.mkdir(exist_ok=True)

# ---------------------------------------------------------------------------
# Set to True to skip Drive and have app.py load the ONNX files from disk
# directly.  In app.py, remove the download_from_drive call for these keys
# (or just leave the placeholder Drive ID — the script already guards against
# missing files gracefully).
# ---------------------------------------------------------------------------
LOCAL_ONLY = True   # flip to False once you have Drive IDs


# ===========================================================================
# 1. SRCNN  ×4
#    Architecture: Dong et al. 2014 — 3 conv layers, no upsampling inside
#    the network.  Input is bicubic-upscaled LR; output is the refined HR.
#    We bicubic-upsample inside a wrapper so the ONNX takes a raw LR image.
# ===========================================================================

class SRCNN(nn.Module):
    """Original SRCNN (Dong et al., 2014)."""
    def __init__(self, num_channels: int = 3):
        super().__init__()
        self.conv1 = nn.Conv2d(num_channels, 64,  kernel_size=9, padding=9 // 2)
        self.conv2 = nn.Conv2d(64,           32,  kernel_size=5, padding=5 // 2)
        self.conv3 = nn.Conv2d(32,           num_channels, kernel_size=5, padding=5 // 2)
        self.relu  = nn.ReLU(inplace=True)

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        x = self.relu(self.conv1(x))
        x = self.relu(self.conv2(x))
        return self.conv3(x)


class SRCNNx4Wrapper(nn.Module):
    """
    Wraps SRCNN so the ONNX input is a LOW-resolution image.
    Internally bicubic-upsamples by ×4 before feeding SRCNN,
    matching the interface expected by app.py's tile_upscale_model.
    """
    def __init__(self, srcnn: SRCNN, scale: int = 4):
        super().__init__()
        self.srcnn = srcnn
        self.scale = scale

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        # x: (1, 3, H, W) — low-res, float32 in [0, 1]
        up = torch.nn.functional.interpolate(
            x, scale_factor=self.scale, mode="bicubic", align_corners=False
        )
        return self.srcnn(up)


def build_srcnn_x4() -> nn.Module:
    """
    Loads pretrained SRCNN weights from the basicsr model zoo.
    Falls back to random init with a warning if download fails.
    """
    srcnn   = SRCNN(num_channels=3)
    wrapper = SRCNNx4Wrapper(srcnn, scale=4)

    # Pretrained weights from the basicsr / mmedit community
    # (original Caffe weights re-converted to PyTorch by https://github.com/yjn870/SRCNN-pytorch)
    SRCNN_WEIGHTS_URL = (
        "https://github.com/yjn870/SRCNN-pytorch/raw/master/models/"
        "srcnn_x4.pth"
    )
    weights_path = MODEL_DIR / "srcnn_x4.pth"

    if not weights_path.exists():
        print("  Downloading SRCNN ×4 weights …")
        try:
            import urllib.request
            urllib.request.urlretrieve(SRCNN_WEIGHTS_URL, weights_path)
            print(f"  Saved → {weights_path}")
        except Exception as e:
            print(f"  [WARN] Could not download SRCNN weights: {e}")
            print("  Continuing with random init (quality will be poor).")
            return wrapper

    state = torch.load(weights_path, map_location="cpu")
    # The yjn870 checkpoint uses keys conv1/conv2/conv3 matching our module
    try:
        srcnn.load_state_dict(state, strict=True)
        print("  SRCNN weights loaded ✓")
    except RuntimeError as e:
        print(f"  [WARN] Weight mismatch: {e}\n  Proceeding with partial load.")
        srcnn.load_state_dict(state, strict=False)

    return wrapper


# ===========================================================================
# 2. EDSR (HResNet-style)  ×4
#    EDSR-baseline (Lim et al., 2017) is the canonical "deep residual" SR
#    network.  Pretrained weights from eugenesiow/torch-sr (HuggingFace).
# ===========================================================================

class ResBlock(nn.Module):
    def __init__(self, n_feats: int, res_scale: float = 1.0):
        super().__init__()
        self.body = nn.Sequential(
            nn.Conv2d(n_feats, n_feats, 3, padding=1),
            nn.ReLU(inplace=True),
            nn.Conv2d(n_feats, n_feats, 3, padding=1),
        )
        self.res_scale = res_scale

    def forward(self, x):
        return x + self.body(x) * self.res_scale


class Upsampler(nn.Sequential):
    def __init__(self, scale: int, n_feats: int):
        layers = []
        if scale in (2, 4):
            steps = {2: 1, 4: 2}[scale]
            for _ in range(steps):
                layers += [
                    nn.Conv2d(n_feats, 4 * n_feats, 3, padding=1),
                    nn.PixelShuffle(2),
                ]
        elif scale == 3:
            layers += [
                nn.Conv2d(n_feats, 9 * n_feats, 3, padding=1),
                nn.PixelShuffle(3),
            ]
        super().__init__(*layers)


class EDSR(nn.Module):
    """
    EDSR-baseline: 16 residual blocks, 64 feature channels.
    Matches the publicly released weights from eugenesiow/torch-sr.
    """
    def __init__(self, n_resblocks: int = 16, n_feats: int = 64,
                 scale: int = 4, num_channels: int = 3):
        super().__init__()
        self.head = nn.Conv2d(num_channels, n_feats, 3, padding=1)
        self.body = nn.Sequential(*[ResBlock(n_feats) for _ in range(n_resblocks)])
        self.body_tail = nn.Conv2d(n_feats, n_feats, 3, padding=1)
        self.tail = nn.Sequential(
            Upsampler(scale, n_feats),
            nn.Conv2d(n_feats, num_channels, 3, padding=1),
        )

    def forward(self, x):
        x = self.head(x)
        res = self.body(x)
        res = self.body_tail(res)
        x = x + res
        return self.tail(x)


def build_edsr_x4() -> nn.Module:
    """
    Downloads EDSR-baseline ×4 weights and loads them.
    Source: eugenesiow/torch-sr (Apache-2.0 licensed).
    """
    model = EDSR(n_resblocks=16, n_feats=64, scale=4)

    # Direct link to the EDSR-baseline ×4 checkpoint
    EDSR_WEIGHTS_URL = (
        "https://huggingface.co/eugenesiow/edsr-base/resolve/main/"
        "pytorch_model_4x.pt"
    )
    weights_path = MODEL_DIR / "edsr_x4.pt"

    if not weights_path.exists():
        print("  Downloading EDSR ×4 weights from HuggingFace …")
        try:
            import urllib.request
            urllib.request.urlretrieve(EDSR_WEIGHTS_URL, weights_path)
            print(f"  Saved → {weights_path}")
        except Exception as e:
            print(f"  [WARN] Could not download EDSR weights: {e}")
            print("  Continuing with random init (quality will be poor).")
            return model

    state = torch.load(weights_path, map_location="cpu")

    # eugenesiow checkpoints may wrap state_dict under a 'model' key
    if "model" in state:
        state = state["model"]
    if "state_dict" in state:
        state = state["state_dict"]

    # Strip any 'module.' prefix from DataParallel wrapping
    state = {k.replace("module.", ""): v for k, v in state.items()}

    try:
        model.load_state_dict(state, strict=True)
        print("  EDSR weights loaded ✓")
    except RuntimeError as e:
        print(f"  [WARN] Weight mismatch ({e}). Trying strict=False …")
        model.load_state_dict(state, strict=False)
        print("  EDSR weights loaded (partial) ✓")

    return model


# ===========================================================================
# ONNX export helper
# ===========================================================================

def export_onnx(model: nn.Module, out_path: Path, tile_h: int = 128, tile_w: int = 128):
    """Export *model* to ONNX with dynamic H/W axes."""
    model.eval()
    dummy = torch.zeros(1, 3, tile_h, tile_w)
    torch.onnx.export(
        model,
        dummy,
        str(out_path),
        opset_version=17,
        input_names=["input"],
        output_names=["output"],
        dynamic_axes={
            "input":  {0: "batch", 2: "H", 3: "W"},
            "output": {0: "batch", 2: "H_out", 3: "W_out"},
        },
    )
    size_mb = out_path.stat().st_size / 1_048_576
    print(f"  Exported → {out_path}  ({size_mb:.1f} MB)")


# ===========================================================================
# Main
# ===========================================================================

if __name__ == "__main__":
    print("=" * 60)
    print("SpectraGAN — ONNX model exporter")
    print("=" * 60)

    # -- SRCNN ×4 ------------------------------------------------------------
    srcnn_out = MODEL_DIR / "SRCNN_x4.onnx"
    if srcnn_out.exists():
        print(f"\n[SKIP] {srcnn_out} already exists.")
    else:
        print("\n[1/2] Building SRCNN ×4 …")
        srcnn_model = build_srcnn_x4()
        print("  Exporting to ONNX …")
        export_onnx(srcnn_model, srcnn_out, tile_h=128, tile_w=128)

    # -- EDSR (HResNet) ×4 ---------------------------------------------------
    edsr_out = MODEL_DIR / "HResNet_x4.onnx"
    if edsr_out.exists():
        print(f"\n[SKIP] {edsr_out} already exists.")
    else:
        print("\n[2/2] Building EDSR (HResNet) ×4 …")
        edsr_model = build_edsr_x4()
        print("  Exporting to ONNX …")
        export_onnx(edsr_model, edsr_out, tile_h=128, tile_w=128)

    print("\n" + "=" * 60)
    print("Done!  Files created:")
    for p in [srcnn_out, edsr_out]:
        status = "✓" if p.exists() else "✗ MISSING"
        print(f"  {status}  {p}")
    print()

    if LOCAL_ONLY:
        print("LOCAL_ONLY = True:")
        print("  app.py will load these files directly from disk.")
        print("  No Google Drive upload needed.")
    else:
        print("Next step:")
        print("  Upload the .onnx files to Google Drive and paste")
        print("  the file IDs into DRIVE_IDS in app.py.")
    print("=" * 60)