testmobileclip

mobileclip

Model card Files Files and versions

xet

Community

finhdev commited on Aug 4, 2025

Commit

dc1caec

verified ·

1 Parent(s): 147df04

Update handler.py

Browse files

Files changed (1) hide show

handler.py +8 -85

handler.py CHANGED Viewed

@@ -1,20 +1,14 @@
-# handler.py  (repo root)
 import io, base64, torch
 from PIL import Image
 import open_clip
 class EndpointHandler:
     """
-    Zero‑shot classifier for MobileCLIP‑B (OpenCLIP).
-    Expected client JSON *to the endpoint*:
-    {
-      "inputs": {
-        "image": "<base64 PNG/JPEG>",
-        "candidate_labels": ["cat", "dog", ...]
-      }
-    }
     """
     def __init__(self, path: str = ""):
@@ -24,11 +18,15 @@ class EndpointHandler:
         )
         self.model.eval()
         self.tokenizer = open_clip.get_tokenizer("MobileCLIP-B")
         self.device = "cuda" if torch.cuda.is_available() else "cpu"
         self.model.to(self.device)
     def __call__(self, data):
         # ── unwrap Hugging Face's `inputs` envelope ───────────
         payload = data.get("inputs", data)
@@ -57,81 +55,6 @@ class EndpointHandler:
             {"label": l, "score": float(p)}
             for l, p in sorted(zip(labels, probs), key=lambda x: x[1], reverse=True)
         ]
-# import io, base64, torch
-# from PIL import Image
-# import open_clip
-# class EndpointHandler:
-#     """
-#     Zero‑shot classifier for MobileCLIP‑B (OpenCLIP) with a text‑embedding cache.
-#     Client JSON:
-#     {
-#       "inputs": {
-#         "image": "<base64 PNG/JPEG>",
-#         "candidate_labels": ["cat", "dog", ...]
-#       }
-#     }
-#     """
-#     # ------------------------------------------------- #
-#     #                 INITIALISATION                    #
-#     # ------------------------------------------------- #
-#     def __init__(self, path: str = ""):
-#         weights = f"{path}/mobileclip_b.pt"
-#         self.model, _, self.preprocess = open_clip.create_model_and_transforms(
-#             "MobileCLIP-B", pretrained=weights
-#         )
-#         self.model.eval()
-#         self.tokenizer = open_clip.get_tokenizer("MobileCLIP-B")
-#         self.device = "cuda" if torch.cuda.is_available() else "cpu"
-#         self.model.to(self.device)
-#         # cache: {prompt -> 1×512 tensor on device}
-#         self.label_cache: dict[str, torch.Tensor] = {}
-#     # ------------------------------------------------- #
-#     #                    INFERENCE                      #
-#     # ------------------------------------------------- #
-#     def __call__(self, data):
-#         payload = data.get("inputs", data)
-#         img_b64 = payload["image"]
-#         labels  = payload.get("candidate_labels", [])
-#         if not labels:
-#             return {"error": "candidate_labels list is empty"}
-#         # --- image ----
-#         image = Image.open(io.BytesIO(base64.b64decode(img_b64))).convert("RGB")
-#         img_tensor = self.preprocess(image).unsqueeze(0).to(self.device)
-#         # --- text (with cache) ----
-#         missing = [l for l in labels if l not in self.label_cache]
-#         if missing:
-#             tokens = self.tokenizer(missing).to(self.device)
-#             with torch.no_grad():
-#                 emb = self.model.encode_text(tokens)
-#                 emb = emb / emb.norm(dim=-1, keepdim=True)
-#             for l, e in zip(missing, emb):
-#                 self.label_cache[l] = e
-#         txt_feat = torch.stack([self.label_cache[l] for l in labels])
-#         # --- forward & softmax ----
-#         with torch.no_grad(), torch.cuda.amp.autocast():
-#             img_feat = self.model.encode_image(img_tensor)
-#             img_feat = img_feat / img_feat.norm(dim=-1, keepdim=True)
-#             probs = (100 * img_feat @ txt_feat.T).softmax(dim=-1)[0].tolist()
-#         # --- sorted output ----
-#         return [
-#             {"label": l, "score": float(p)}
-#             for l, p in sorted(zip(labels, probs), key=lambda x: x[1], reverse=True)
-#         ]
 # # handler.py  (repo root)
 # import io, base64, torch
 # from PIL import Image

 import io, base64, torch
 from PIL import Image
 import open_clip
+# Make sure the mobileclip library is installed in your Hugging Face environment
+# You might need to add it to your requirements.txt
+from mobileclip.modules.common.mobileone import reparameterize_model
 class EndpointHandler:
     """
+    Zero-shot classifier for MobileCLIP-B (OpenCLIP).
     """
     def __init__(self, path: str = ""):
         )
         self.model.eval()
+        # *** THIS IS THE CRUCIAL ADDITION ***
+        self.model = reparameterize_model(self.model)
         self.tokenizer = open_clip.get_tokenizer("MobileCLIP-B")
         self.device = "cuda" if torch.cuda.is_available() else "cpu"
         self.model.to(self.device)
     def __call__(self, data):
+        # ... (the rest of your __call__ method remains the same)
         # ── unwrap Hugging Face's `inputs` envelope ───────────
         payload = data.get("inputs", data)
             {"label": l, "score": float(p)}
             for l, p in sorted(zip(labels, probs), key=lambda x: x[1], reverse=True)
         ]
 # # handler.py  (repo root)
 # import io, base64, torch
 # from PIL import Image