Upload code/ with huggingface_hub
code/inference.py +342 -0
code/inference.py
ADDED
@@ -0,0 +1,342 @@
import itertools
import json
import logging
import time
from typing import Dict, Optional, Union

import torch
from nltk import sent_tokenize
from transformers import (
    AutoModelForSeq2SeqLM,
    AutoTokenizer,
    PreTrainedModel,
    PreTrainedTokenizer,
)


class QGPipeline:

    def __init__(
        self,
        model: PreTrainedModel,
        tokenizer: PreTrainedTokenizer,
        ans_model: PreTrainedModel,
        ans_tokenizer: PreTrainedTokenizer,
        qg_format: str,
        use_cuda: bool
    ):
        self.model = model
        self.tokenizer = tokenizer

        self.ans_model = ans_model
        self.ans_tokenizer = ans_tokenizer

        self.qg_format = qg_format

        self.device = "cuda" if torch.cuda.is_available() and use_cuda else "cpu"
        self.model.to(self.device)

        if self.ans_model is not self.model:
            self.ans_model.to(self.device)

        assert self.model.__class__.__name__ in ["MT5ForConditionalGeneration"]

        self.model_type = "mt5"

    def __call__(self, inputs: str):
        inputs = " ".join(inputs.split())
        sents, answers = self._extract_answers(inputs)
        flat_answers = list(itertools.chain(*answers))

        if len(flat_answers) == 0:
            return []

        qg_examples = self._prepare_inputs_for_qg_from_answers_hl(sents, answers)

        qg_inputs = [example['source_text'] for example in qg_examples]
        questions = self._generate_questions(qg_inputs)
        output = [{'answer': example['answer'], 'question': que} for example, que in zip(qg_examples, questions)]
        return output
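
    # __call__ runs a two-stage flow: _extract_answers() proposes answer spans
    # sentence by sentence, _prepare_inputs_for_qg_from_answers_hl() wraps each
    # span in <hl> markers, and _generate_questions() turns the highlighted
    # text into questions. The result is a list of dicts shaped like
    # [{'answer': '...', 'question': '...'}] (values illustrative).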

    def _generate_questions(self, inputs):
        inputs = self._tokenize(inputs, padding=True, truncation=True)

        outs = self.model.generate(
            input_ids=inputs['input_ids'].to(self.device),
            attention_mask=inputs['attention_mask'].to(self.device),
            max_length=80,
            num_beams=4,
        )

        questions = [self.tokenizer.decode(ids, skip_special_tokens=True) for ids in outs]
        return questions

    def _extract_answers(self, context):
        sents, inputs = self._prepare_inputs_for_ans_extraction(context)

        inputs = self._tokenize(inputs, padding=True, truncation=True)

        outs = self.ans_model.generate(
            input_ids=inputs['input_ids'].to(self.device),
            attention_mask=inputs['attention_mask'].to(self.device),
            max_length=80,
        )

        dec = [self.ans_tokenizer.decode(ids, skip_special_tokens=True) for ids in outs]

        # Each decoded string looks like "ans1 <sep> ans2 <sep> "; splitting on
        # <sep> leaves a trailing empty piece, which [:-1] drops.
        answers = [item.split('<sep>') for item in dec]
        answers = [i[:-1] for i in answers]
        cleaned = [[ans.replace("<pad>", "") for ans in ans_list] for ans_list in answers]
        logger.debug(cleaned)
        return sents, cleaned

    def _tokenize(
        self,
        inputs,
        padding=True,
        truncation=True,
        add_special_tokens=True,
        max_length=512
    ):
        inputs = self.tokenizer.batch_encode_plus(
            inputs,
            max_length=max_length,
            add_special_tokens=add_special_tokens,
            truncation=truncation,
            padding="max_length" if padding else False,
            return_tensors="pt"
        )
        return inputs
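
    # With padding enabled, _tokenize returns a BatchEncoding whose
    # 'input_ids' and 'attention_mask' tensors have shape (batch, max_length).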

    def _prepare_inputs_for_ans_extraction(self, text):
        sents = sent_tokenize(text)

        inputs = []
        for i in range(len(sents)):
            source_text = "extract answers:"
            for j, sent in enumerate(sents):
                if i == j:
                    sent = "<hl> %s <hl>" % sent
                source_text = "%s %s" % (source_text, sent)
            source_text = source_text.strip()

            if self.model_type == "mt5":
                source_text = source_text + " </s>"

            inputs.append(source_text)

        return sents, inputs
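
    # One extraction prompt is built per sentence, each highlighting a
    # different sentence. Illustrative shape of a single prompt (made-up text):
    #   "extract answers: <hl> Ankara Türkiye'nin başkentidir. <hl>
    #    Nüfusu beş milyonun üzerindedir. </s>"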

    def _prepare_inputs_for_qg_from_answers_hl(self, sents, answers):
        inputs = []
        for i, answer in enumerate(answers):
            if len(answer) == 0:
                continue
            for answer_text in answer:
                sent = sents[i]
                sents_copy = sents[:]

                answer_text = answer_text.strip()

                try:
                    ans_start_idx = sent.index(answer_text)

                    sent = f"{sent[:ans_start_idx]} <hl> {answer_text} <hl> {sent[ans_start_idx + len(answer_text):]}"
                    sents_copy[i] = sent

                    source_text = " ".join(sents_copy)
                    source_text = f"generate question: {source_text}"
                    if self.model_type == "mt5":
                        source_text = source_text + " </s>"
                except ValueError:
                    # str.index raises ValueError when the extracted answer
                    # does not occur verbatim in its sentence; skip it.
                    continue

                inputs.append({"answer": answer_text, "source_text": source_text})

        return inputs


class MultiTaskQAQGPipeline(QGPipeline):
    def __init__(self, **kwargs):
        super().__init__(**kwargs)

    def __call__(self, inputs: Union[Dict, str]):
        if isinstance(inputs, str):
            # do qg
            return super().__call__(inputs)
        else:
            # do qa
            return self._extract_answer(inputs["question"], inputs["context"])

    def _prepare_inputs_for_qa(self, question, context):
        source_text = f"question: {question} context: {context}"
        if self.model_type == "mt5":
            source_text = source_text + " </s>"
        return source_text

    def _extract_answer(self, question, context):
        source_text = self._prepare_inputs_for_qa(question, context)
        inputs = self._tokenize([source_text], padding=False)
        outs = self.model.generate(
            input_ids=inputs['input_ids'].to(self.device),
            attention_mask=inputs['attention_mask'].to(self.device),
            max_length=80,
        )

        answer = self.tokenizer.decode(outs[0], skip_special_tokens=True)

        return answer
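
# Illustrative usage of the dispatch above (hypothetical "pipe" instance):
#   pipe("Ankara Türkiye'nin başkentidir.")                   -> QG mode
#   pipe({"question": "Türkiye'nin başkenti neresidir?",
#         "context": "Ankara Türkiye'nin başkentidir."})      -> QA mode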

SUPPORTED_TASKS = {
    "multitask-qa-qg": {
        "impl": MultiTaskQAQGPipeline,
        "default": {
            "model": "ozcangundes/mt5-multitask-qa-qg-turkish",
        }
    },
}


def pipelinex(
    task: str,
    model: Optional[Union[str, PreTrainedModel]] = None,
    tokenizer: Optional[Union[str, PreTrainedTokenizer]] = None,
    qg_format: Optional[str] = "highlight",
    ans_model: Optional[Union[str, PreTrainedModel]] = None,
    ans_tokenizer: Optional[Union[str, PreTrainedTokenizer]] = None,
    use_cuda: Optional[bool] = True,
    **kwargs,
):
    # Retrieve the task
    if task not in SUPPORTED_TASKS:
        raise KeyError("Unknown task {}, available tasks are {}".format(task, list(SUPPORTED_TASKS.keys())))

    targeted_task = SUPPORTED_TASKS[task]
    task_class = targeted_task["impl"]

    # Use the task's default model if none is provided
    if model is None:
        model = targeted_task["default"]["model"]

    # Try to infer the tokenizer from the model name (if provided as a str)
    if tokenizer is None:
        if isinstance(model, str):
            tokenizer = model
        else:
            # Impossible to guess the right tokenizer here
            raise Exception(
                "Impossible to guess which tokenizer to use. "
                "Please provide a PreTrainedTokenizer class or a path/identifier to a pretrained tokenizer."
            )

    # Instantiate the tokenizer if needed
    if isinstance(tokenizer, (str, tuple)):
        if isinstance(tokenizer, tuple):
            # For a tuple we have (tokenizer name, {kwargs})
            tokenizer = AutoTokenizer.from_pretrained(tokenizer[0], **tokenizer[1])
        else:
            tokenizer = AutoTokenizer.from_pretrained(tokenizer)

    # Instantiate the model if needed
    if isinstance(model, str):
        model = AutoModelForSeq2SeqLM.from_pretrained(model)
    logger.debug(ans_model)
    # The multitask checkpoint handles both answer extraction and question
    # generation, so the same model/tokenizer pair serves both roles and the
    # ans_model/ans_tokenizer arguments are effectively ignored.
    return task_class(model=model, tokenizer=tokenizer, ans_model=model, ans_tokenizer=tokenizer, qg_format=qg_format,
                      use_cuda=use_cuda)
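
# Minimal local usage sketch (assumes Hub access and nltk's "punkt" data;
# "nlp" is a hypothetical variable name):
#   nlp = pipelinex("multitask-qa-qg", use_cuda=False)
#   questions = nlp("Ankara Türkiye'nin başkentidir.")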

################################################################################################
# SageMaker-style inference handlers


logger = logging.getLogger(__name__)
logger.setLevel(logging.DEBUG)

JSON_CONTENT_TYPE = 'application/json'


# Load the model into memory and return it. Note that it is pulled from the
# Hugging Face Hub rather than from the model_dir SageMaker passes in.
def model_fn(model_dir=None):
    model = AutoModelForSeq2SeqLM.from_pretrained("canovich/myprivateee")
    return model
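
# If the "canovich/myprivateee" checkpoint is private, the endpoint needs a
# Hub token with access to it; otherwise from_pretrained() will fail.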


# Perform prediction on the deserialized object with the loaded model. The
# caller must also supply the tokenizer, since model_fn only loads the model.
def predict_fn(input_data, model, tokenizer):
    logger.info("Calling model")
    start_time = time.time()
    # pipelinex() is defined above (pipelines.py in the cloned repo)
    multimodel = pipelinex("multitask-qa-qg", tokenizer=tokenizer, model=model)
    answers = multimodel(input_data)
    print("--- Inference time: %s seconds ---" % (time.time() - start_time))
    return answers


# Deserialize the Invoke request body into an object we can perform prediction on
def input_fn(request_body, content_type=JSON_CONTENT_TYPE):
    logger.info('Deserializing the input data.')
    # The JSON body arrives as a string of the form '{"text": "..."}' and has
    # to be parsed before the text field can be read.
    if content_type == JSON_CONTENT_TYPE:
        return json.loads(request_body)["text"]
    raise Exception('Requested unsupported ContentType in content_type: {}'.format(content_type))


# Serialize the prediction result into the desired response content type
def output_fn(prediction, accept=JSON_CONTENT_TYPE):
    logger.info('Serializing the generated output.')
    if accept == JSON_CONTENT_TYPE:
        return json.dumps(prediction), accept
    raise Exception('Requested unsupported ContentType in Accept: {}'.format(accept))
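
Taken together, the four handlers form one request path: input_fn parses the JSON body, predict_fn builds the multitask pipeline and runs it, and output_fn serializes the result. Below is a minimal local smoke test of that chain; it is a sketch assuming the handlers above are in scope, the "canovich/myprivateee" checkpoint is accessible, and the tokenizer is loaded separately because model_fn only returns the model.

import json

from transformers import AutoTokenizer

# Load the model the way the endpoint would, plus a matching tokenizer
# (model_fn does not load one, so the caller supplies it to predict_fn).
model = model_fn()
tokenizer = AutoTokenizer.from_pretrained("canovich/myprivateee")

# Simulate a single Invoke request end to end.
request_body = json.dumps({"text": "Ankara Türkiye'nin başkentidir."})
text = input_fn(request_body, content_type=JSON_CONTENT_TYPE)
prediction = predict_fn(text, model, tokenizer)
body, content_type = output_fn(prediction, accept=JSON_CONTENT_TYPE)
print(content_type, body)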