cguynup
/

flash_gen_bert_para

Model card Files Files and versions

cguynup committed on Nov 22, 2023

Commit

c5d740a

·

1 Parent(s): c0592b4

Update handler.py

Files changed (1) hide show

handler.py +15 -9

handler.py CHANGED Viewed

@@ -1,20 +1,26 @@
-from typing import  Dict, List, Any
-from optimum.onnxruntime import ORTModelForSequenceClassification
-from transformers import AutoTokenizer, pipeline
 class EndpointHandler():
     def __init__(self, path=""):
         # load the optimized model
-        model = ORTModelForSequenceClassification.from_pretrained(path)
-        tokenizer = AutoTokenizer.from_pretrained(path, do_lower_case=True)
         self.pipeline = pipeline("text-classification", model=model, tokenizer=tokenizer)
-    def __call__(self, data: Any) -> List[List[Dict[str, float]]]:
         inputs = data.pop("inputs", data)
-        prediction = self.pipeline(inputs, padding=True, truncation=True, max_length=253)
-        return prediction

+from transformers import DistilBertTokenizerFast, DistilBertForSequenceClassification, pipeline
 class EndpointHandler():
     def __init__(self, path=""):
         # load the optimized model
+        model = DistilBertForSequenceClassification.from_pretrained(path)
+        tokenizer = DistilBertTokenizerFast.from_pretrained(path, do_lower_case=True)
         self.pipeline = pipeline("text-classification", model=model, tokenizer=tokenizer)
+    def __call__(self, data):
         inputs = data.pop("inputs", data)
+        def iterator():
+            for i in inputs:
+                yield i
+        labels = []
+        for out in pipeline(iterator(), padding=True, truncation=True, max_length=253):
+            labels.append(int(out["label"][-1]))
+        return {
+            "pairs": inputs,
+            "evaluations": labels
+        }