mgbam committed on
Commit
e97ac39
·
verified ·
1 Parent(s): ce9678d

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +219 -44
app.py CHANGED
@@ -1,54 +1,229 @@
 
 
 
 
 
1
  import torch
2
- import torch.nn as nn
3
- from torchvision import models, transforms
4
- from torch.utils.data import DataLoader
5
  from PIL import Image
6
- import gradio as gr
7
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
8
  DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
9
 
10
- # Load class names (make sure this file is in the Space)
11
- with open("cifar10_classes.txt") as f:
12
- CLASSES = [line.strip() for line in f.readlines()]
13
-
14
- def build_model(num_classes: int, device: str = "cpu"):
15
- try:
16
- weights = models.ResNet18_Weights.DEFAULT
17
- model = models.resnet18(weights=weights)
18
- except AttributeError:
19
- model = models.resnet18(weights="IMAGENET1K_V1")
20
- model.fc = nn.Linear(model.fc.in_features, num_classes)
21
- model = model.to(device)
22
- return model
23
-
24
- num_classes = len(CLASSES)
25
- model = build_model(num_classes, device=DEVICE)
26
-
27
- state_dict = torch.load("ast_cifar10_resnet18.pth", map_location=DEVICE)
28
- model.load_state_dict(state_dict)
29
- model.eval()
30
-
31
- preprocess = transforms.Compose([
32
- transforms.Resize((224, 224)),
33
- transforms.ToTensor(),
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
34
  ])
35
 
36
- def predict(image: Image.Image):
37
- if image is None:
38
- return {}
39
- x = preprocess(image).unsqueeze(0).to(DEVICE)
40
- with torch.no_grad():
41
- logits = model(x)
42
- probs = torch.softmax(logits, dim=1)[0]
43
- return {CLASSES[i]: float(probs[i]) for i in range(len(CLASSES))}
44
-
45
- demo = gr.Interface(
46
- fn=predict,
47
- inputs=gr.Image(type="pil", label="Upload CIFAR-like image"),
48
- outputs=gr.Label(num_top_classes=3, label="Top-3 Predictions"),
49
- title="AST CIFAR-10 Classifier",
50
- description="ResNet18 fine-tuned with Adaptive Sparse Training (AST) on CIFAR-10.",
51
- )
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
52
 
 
53
  if __name__ == "__main__":
54
  demo.launch()
 
1
+ import os
2
+ from pathlib import Path
3
+ from typing import Optional, Tuple, Dict, List
4
+
5
+ import gradio as gr
6
  import torch
7
+ import torch.nn.functional as F
 
 
8
  from PIL import Image
 
9
 
10
+ import torchvision.transforms as T
11
+ from torchvision.models import resnet18
12
+
13
# -----------------------------
# Config
# -----------------------------
# The ten CIFAR-10 class names, index-aligned with the model's output logits.
CIFAR10_CLASSES = [
    "airplane","automobile","bird","cat","deer","dog","frog","horse","ship","truck"
]

# CIFAR-10 normalization (standard)
# Per-channel RGB mean/std of the CIFAR-10 training set, used by `preprocess`.
CIFAR10_MEAN = (0.4914, 0.4822, 0.4465)
CIFAR10_STD = (0.2470, 0.2435, 0.2616)

EXAMPLES_DIR = Path("Examples")  # you uploaded to this folder
# Run inference on GPU when available, otherwise fall back to CPU.
DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
26
 
27
+ # -----------------------------
28
+ # Utilities
29
+ # -----------------------------
30
def find_checkpoint(repo_root: Path) -> Optional[Path]:
    """
    Locate a weights file in the repo root.

    Checks a list of conventional filenames first, then falls back to
    globbing for *.pth / *.pt files, preferring names containing
    resnet/cifar/ast/sparse/best. Returns None when nothing matches.
    """
    known_names = (
        "model.pth", "model.pt",
        "checkpoint.pth", "checkpoint.pt",
        "best.pth", "best.pt",
        "resnet18.pth", "resnet18.pt",
        "weights.pth", "weights.pt",
    )
    for name in known_names:
        candidate = repo_root / name
        if candidate.exists() and candidate.is_file():
            return candidate

    # Pattern search fallback; any *.pth match wins over every *.pt match.
    keywords = ("resnet", "cifar", "ast", "sparse", "best")
    for pattern in ("*.pth", "*.pt"):
        matches = sorted(repo_root.glob(pattern))
        preferred = [m for m in matches if any(k in m.name.lower() for k in keywords)]
        if preferred:
            return preferred[0]
        if matches:
            return matches[0]

    return None
60
+
61
+
62
def build_model(num_classes: int = 10) -> torch.nn.Module:
    """Create a randomly initialized ResNet-18 with a num_classes-way head."""
    net = resnet18(weights=None)
    in_features = net.fc.in_features
    net.fc = torch.nn.Linear(in_features, num_classes)
    return net
66
+
67
+
68
def load_weights(model: torch.nn.Module, ckpt_path: Path) -> None:
    """
    Load model weights from a checkpoint file into `model` (in place).

    Handles common checkpoint formats:
      - a plain state_dict
      - a dict wrapping the state_dict under a 'state_dict' or 'model' key

    Keys saved by DDP/DataParallel have their leading 'module.' stripped.
    Loading is non-strict; any mismatched keys are printed to stdout.

    Raises:
        ValueError: if the checkpoint is not a dict-like object.
    """
    ckpt = torch.load(ckpt_path, map_location="cpu")

    if not isinstance(ckpt, dict):
        raise ValueError(f"Unsupported checkpoint format: {type(ckpt)}")

    if "state_dict" in ckpt and isinstance(ckpt["state_dict"], dict):
        state = ckpt["state_dict"]
    elif "model" in ckpt and isinstance(ckpt["model"], dict):
        state = ckpt["model"]
    else:
        # might already be a state_dict-like dict
        state = ckpt

    # Strip only a *leading* 'module.' prefix (DDP/DataParallel). The previous
    # str.replace would also mangle keys containing 'module.' mid-name.
    prefix = "module."
    new_state = {
        (k[len(prefix):] if k.startswith(prefix) else k): v
        for k, v in state.items()
    }

    missing, unexpected = model.load_state_dict(new_state, strict=False)
    # Strict=False to be robust; surface any mismatch in the Space logs.
    if missing or unexpected:
        print("[load_weights] Missing keys:", missing)
        print("[load_weights] Unexpected keys:", unexpected)
98
+
99
+
100
# -----------------------------
# Preprocess + Predict
# -----------------------------
# Standard CIFAR-10 input pipeline: resize to the 32x32 training resolution,
# convert to a float tensor in [0, 1], then normalize with dataset statistics.
preprocess = T.Compose([
    T.Resize((32, 32), interpolation=T.InterpolationMode.BILINEAR),
    T.ToTensor(),
    T.Normalize(mean=CIFAR10_MEAN, std=CIFAR10_STD),
])
108
 
109
def pil_to_model_tensor(img: Image.Image) -> torch.Tensor:
    """Convert a PIL image into a normalized [1, 3, 32, 32] input batch."""
    rgb = img.convert("RGB")
    return preprocess(rgb).unsqueeze(0)
113
+
114
def predict(img: "Image.Image"):
    """
    Run the classifier on one uploaded image.

    Returns a 4-tuple matching the Gradio outputs wired to this function:
      (32x32 preview image, {class: probability} dict, top-3 table rows,
       markdown headline text). All four are None when no image is given.

    Raises:
        gr.Error: if the model failed to load at startup.
    """
    if img is None:
        # Must match the arity of the success path: the click handler has
        # four outputs, so returning only three values breaks the UI here.
        return None, None, None, None

    if STATE["model"] is None:
        raise gr.Error("Model is not loaded. Check that your checkpoint exists in the Space repo.")

    # Show exactly what goes into the model (32x32)
    img32 = img.convert("RGB").resize((32, 32), resample=Image.BILINEAR)

    x = pil_to_model_tensor(img).to(DEVICE)
    with torch.inference_mode():
        logits = STATE["model"](x)
        probs = F.softmax(logits, dim=1).squeeze(0)  # [10]

    # Top-3 class names with their probabilities.
    topk = torch.topk(probs, k=3)
    top3 = [(CIFAR10_CLASSES[i], float(topk.values[j])) for j, i in enumerate(topk.indices.tolist())]

    # Gradio Label expects dict label->confidence
    label_dict = {cls: float(probs[i]) for i, cls in enumerate(CIFAR10_CLASSES)}

    # Table rows for the top-3 dataframe.
    top3_table = [[name, f"{p*100:.2f}%"] for name, p in top3]

    # Headline prediction text.
    pred_name, pred_p = top3[0]
    pred_text = f"**{pred_name}** ({pred_p*100:.2f}%)"

    return img32, label_dict, top3_table, pred_text
144
+
145
+
146
+ # -----------------------------
147
+ # App state
148
+ # -----------------------------
149
# Module-level mutable state: holds the loaded model, or None if init() failed.
STATE: Dict[str, Optional[torch.nn.Module]] = {"model": None}
150
+
151
def init():
    """Find and load the checkpoint into STATE['model'] (None on failure)."""
    ckpt = find_checkpoint(Path("."))
    if ckpt is None:
        print("[init] No checkpoint found in repo root.")
        STATE["model"] = None
        return

    print(f"[init] Loading checkpoint: {ckpt}")
    net = build_model(num_classes=len(CIFAR10_CLASSES))
    load_weights(net, ckpt)
    net.to(DEVICE).eval()
    STATE["model"] = net
164
+
165
def get_examples() -> List[List[str]]:
    """Collect example image paths from EXAMPLES_DIR, formatted for gr.Examples."""
    if not EXAMPLES_DIR.exists():
        return []
    allowed = [".png", ".jpg", ".jpeg"]
    paths = sorted(p for p in EXAMPLES_DIR.iterdir() if p.suffix.lower() in allowed)
    # gr.Examples wants one inner list per input component.
    return [[str(p)] for p in paths]
171
+
172
# Load the model and gather example images once, at import time.
init()
EXAMPLES = get_examples()
174
+
175
# -----------------------------
# UI
# -----------------------------
# Gradio Blocks layout: image upload on the left (plus a preview of the exact
# 32x32 input fed to the model), predictions on the right, buttons below.
with gr.Blocks(title="AST CIFAR-10 Classifier") as demo:
    gr.Markdown(
        "# AST CIFAR-10 Classifier\n"
        "ResNet18 fine-tuned with Adaptive Sparse Training (AST) on CIFAR-10.\n\n"
        f"**Device:** `{DEVICE}`"
    )

    with gr.Row():
        with gr.Column(scale=1):
            img_in = gr.Image(type="pil", label="Upload CIFAR-like image")

            # Show the exact 32×32 fed to model (useful for debugging)
            img_32 = gr.Image(type="pil", label="Model input (32×32)")

        with gr.Column(scale=1):
            gr.Markdown("### Top-3 Predictions")
            # Full per-class probability dict; Label renders the top 3.
            pred_label = gr.Label(num_top_classes=3, label="Probabilities")
            top3_table = gr.Dataframe(
                headers=["class", "confidence"],
                datatype=["str", "str"],
                row_count=3,
                col_count=(2, "fixed"),
                interactive=False,
                label="Top-3"
            )
            # Headline prediction, rendered from markdown built in predict().
            pred_text = gr.Markdown()

    with gr.Row():
        submit = gr.Button("Submit", variant="primary")
        clear = gr.Button("Clear")

    if EXAMPLES:
        gr.Markdown("### Examples (from `Examples/` folder)")
        # NOTE(review): cache_examples=True without fn/outputs may be ignored
        # or rejected depending on the Gradio version — confirm on the Space.
        gr.Examples(
            examples=EXAMPLES,
            inputs=[img_in],
            cache_examples=True
        )

    # predict must return one value per output component listed here.
    submit.click(
        fn=predict,
        inputs=[img_in],
        outputs=[img_32, pred_label, top3_table, pred_text]
    )

    def _clear():
        # One value per output below. NOTE(review): pred_label is not among
        # the outputs, so the probability display is not reset — confirm intent.
        return None, None, None, ""
    clear.click(fn=_clear, inputs=[], outputs=[img_in, img_32, top3_table, pred_text])

# Enable request queuing so concurrent inferences are serialized.
demo.queue()
if __name__ == "__main__":
    demo.launch()