Upload handler.py
handler.py  CHANGED  +60 -16
@@ -1,18 +1,62 @@
from typing import Dict, Any, List, Union

from transformers import (
    AutoTokenizer,
    AutoModelForSequenceClassification,
    TextClassificationPipeline,
)


class EndpointHandler:
    """Custom handler for Hugging Face Inference Endpoints.

    Loads a fine-tuned text-classification model and exposes a callable
    that the endpoint runtime will invoke. The runtime will instantiate
    this class once at startup, passing the model directory path.
    """

    def __init__(self, path: str = "", **kwargs):
        # `path` is the directory where the model artefacts are stored.
        # Fallback to current directory if not provided (local testing).
        model_dir = path or "."

        # Load tokenizer & model
        self.tokenizer = AutoTokenizer.from_pretrained(model_dir, use_fast=True)
        self.model = AutoModelForSequenceClassification.from_pretrained(model_dir)

        # Build a text-classification pipeline
        self.pipeline = TextClassificationPipeline(
            model=self.model,
            tokenizer=self.tokenizer,
            device=-1,  # CPU; the runtime sets CUDA if available automatically
            return_all_scores=False,
            function_to_apply=(
                "sigmoid"
                if getattr(self.model.config, "problem_type", None)
                == "multi_label_classification"
                else "softmax"
            ),
        )

    def __call__(self, data: Dict[str, Any]) -> Union[Dict[str, Any], List[Dict[str, Any]]]:
        """Run inference on the incoming request.

        Expected input format from the Inference Endpoint runtime:
            {
                "inputs": "some text" | ["text 1", "text 2", ...],
                "parameters": { ... }  # optional pipeline kwargs (e.g., top_k)
            }
        """
        # Extract the text(s)
        raw_inputs = data.get("inputs", data)
        if isinstance(raw_inputs, str):
            raw_inputs = [raw_inputs]

        # Additional pipeline parameters (optional)
        parameters = data.get("parameters", {})

        # Execute the pipeline
        outputs = self.pipeline(raw_inputs, **parameters)

        # If only one input was provided, return a single dict for convenience
        if len(outputs) == 1:
            return outputs[0]
        return outputs
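
For reference, a minimal local smoke test of the handler above, written as a separate script kept next to handler.py. This is a sketch, not part of the uploaded file: the model directory "./my-model", the script name, and the example texts are placeholders.

# test_handler.py -- illustrative local check (assumes the model artefacts
# live in "./my-model"; adjust the path to your own directory).
from handler import EndpointHandler

handler = EndpointHandler(path="./my-model")

# Single string: the handler returns a single result for the one input.
print(handler({"inputs": "I really enjoyed this movie!"}))

# Batch of strings plus optional pipeline kwargs (forwarded as-is to the
# pipeline); a list with one result per input comes back.
print(handler({
    "inputs": ["great battery life", "the screen cracked after a week"],
    "parameters": {"top_k": 1},
}))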
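
Once deployed, the endpoint accepts the same payload shape over HTTP. A sketch of a client call using requests, assuming a standard Inference Endpoints deployment; the endpoint URL and access token are placeholders to replace with your own values.

import requests

# Placeholders for your own endpoint URL and access token.
ENDPOINT_URL = "https://<your-endpoint>.endpoints.huggingface.cloud"
HF_TOKEN = "hf_..."

response = requests.post(
    ENDPOINT_URL,
    headers={
        "Authorization": f"Bearer {HF_TOKEN}",
        "Content-Type": "application/json",
    },
    json={"inputs": "The battery life is fantastic."},
)
print(response.json())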