feat: Adds handler.py for inference endpoints

Browse files

Files changed (3) hide show

README.md +5 -0
handler.py +46 -0
requirements.txt +1 -0

README.md CHANGED Viewed

@@ -15,6 +15,11 @@ widget:
 - text: "George Washington ging nach Washington"
 ---
 ## 4-Language NER in Flair (English, German, Dutch and Spanish)
 This is the standard 4-class NER model for 4 CoNLL-03 languages that ships with [Flair](https://github.com/flairNLP/flair/). Also kind of works for related languages like French.

 - text: "George Washington ging nach Washington"
 ---
+# This is a fork of flair/ner-multi
+  As `flair/ner-multi` is missing a `handler.py`, this form implements a custom `handler.py` to be used with inference endpoints. The original model can be found here: [https://huggingface.co/flair/ner-multi](https://huggingface.co/flair/ner-multi)
 ## 4-Language NER in Flair (English, German, Dutch and Spanish)
 This is the standard 4-class NER model for 4 CoNLL-03 languages that ships with [Flair](https://github.com/flairNLP/flair/). Also kind of works for related languages like French.

handler.py ADDED Viewed

	@@ -0,0 +1,46 @@

+from typing import Any, Dict, List
+import os
+from flair.data import Sentence
+from flair.models import SequenceTagger
+class EndpointHandler():
+    def __init__(
+        self,
+        path: str,
+    ):
+        self.tagger = SequenceTagger.load(os.path.join(path,"pytorch_model.bin"))
+    def __call__(self, data: Dict[str, Any]) -> List[Dict[str, Any]]:
+        """
+        Args:
+            inputs (:obj:`str`):
+                a string containing some text
+        Return:
+            A :obj:`list`:. The object returned should be like [{"entity_group": "XXX", "word": "some word", "start": 3, "end": 6, "score": 0.82}] containing :
+                - "entity_group": A string representing what the entity is.
+                - "word": A substring of the original string that was detected as an entity.
+                - "start": the offset within `input` leading to `answer`. context[start:stop] == word
+                - "end": the ending offset within `input` leading to `answer`. context[start:stop] === word
+                - "score": A score between 0 and 1 describing how confident the model is for this entity.
+        """
+        inputs = data.pop("inputs", data)
+        sentence: Sentence = Sentence(inputs)
+        # Also show scores for recognized NEs
+        self.tagger.predict(sentence, label_name="predicted")
+        entities = []
+        for span in sentence.get_spans("predicted"):
+            if len(span.tokens) == 0:
+                continue
+            current_entity = {
+                "entity_group": span.tag,
+                "word": span.text,
+                "start": span.tokens[0].start_position,
+                "end": span.tokens[-1].end_position,
+                "score": span.score,
+            }
+            entities.append(current_entity)
+        return entities

requirements.txt ADDED Viewed

	@@ -0,0 +1 @@


1	+ flair==0.12.2