Ippoboi
/

minilmail-classifier

+"""
+Inference example for the MiniLM email classifier ONNX model.
+Usage:
+    pip install onnxruntime transformers
+    python example.py
+"""
+import numpy as np
+import onnxruntime as ort
+from transformers import AutoTokenizer
+# Category labels. classify_email() picks the label at the argmax index of the
+# model's "category_probs" output, so the order of this list is significant.
+CATEGORIES = ["ALERT", "NEWSLETTER", "PERSONAL", "SOCIAL", "TRANSACTION"]
+# Hugging Face Hub repository from which main() fetches "model.onnx" and the
+# tokenizer.
+REPO_ID = "Ippoboi/minilmail-classifier"
+def classify_email(
+    session: ort.InferenceSession,
+    tokenizer: AutoTokenizer,
+    subject: str,
+    body: str,
+    action_threshold: float = 0.5,
+) -> dict:
+    """Classify an email and return category + action prediction."""
+    text = f"Subject: {subject}\n\nBody: {body}"
+    inputs = tokenizer(text, return_tensors="np", max_length=256, truncation=True)
+    cat_probs, act_prob = session.run(
+        ["category_probs", "action_prob"],
+        {
+            "input_ids": inputs["input_ids"].astype(np.int64),
+            "attention_mask": inputs["attention_mask"].astype(np.int64),
+            "token_type_ids": np.zeros_like(inputs["input_ids"], dtype=np.int64),
+        },
+    )
+    category_idx = int(np.argmax(cat_probs[0]))
+    return {
+        "category": CATEGORIES[category_idx],
+        "confidence": float(cat_probs[0][category_idx]),
+        "action_required": float(act_prob[0][0]) > action_threshold,
+        "action_probability": float(act_prob[0][0]),
+        "all_probabilities": {
+            cat: float(prob) for cat, prob in zip(CATEGORIES, cat_probs[0])
+        },
+    }
+def main():
+    from huggingface_hub import hf_hub_download
+    # Download model and tokenizer
+    model_path = hf_hub_download(REPO_ID, "model.onnx")
+    tokenizer = AutoTokenizer.from_pretrained(REPO_ID)
+    session = ort.InferenceSession(model_path)
+    # Example emails
+    emails = [
+        ("Your order has shipped", "Your order #12345 is on its way and will arrive by Monday."),
+        ("Meeting tomorrow", "Hey, can we reschedule our 2pm meeting to 3pm? Let me know."),
+        ("Weekly Newsletter", "Check out our latest deals! 50% off everything this weekend."),
+        ("Security Alert", "A new device logged into your account from San Francisco, CA."),
+        ("LinkedIn: New connection", "John Doe wants to connect with you on LinkedIn."),
+    ]
+    print("=" * 60)
+    print("MiniLM Email Classifier")
+    print("=" * 60)
+    for subject, body in emails:
+        result = classify_email(session, tokenizer, subject, body)
+        action = "ACTION" if result["action_required"] else "NO_ACTION"
+        print(f"\n  Subject: {subject}")
+        print(f"  → {result['category']} ({result['confidence']:.1%}) | {action} ({result['action_probability']:.1%})")
+# Run the demo only when this file is executed as a script.
+if __name__ == "__main__":
+    main()