Spaces:

Ravenok
/

statosphere-backend

Running on Zero

App Files Files Community

Lord-Raven commited on Aug 27, 2024

Commit

50b814c

1 Parent(s): 09439d2

Experimenting with few-shot classification.

Browse files

Files changed (2) hide show

app.py +40 -2
requirements.txt +1 -0

app.py CHANGED Viewed

@@ -6,6 +6,7 @@ from transformers import pipeline
 from optimum.onnxruntime import ORTModelForSequenceClassification
 from fastapi import FastAPI
 from fastapi.middleware.cors import CORSMiddleware
 # CORS Config
 app = FastAPI()
@@ -18,6 +19,26 @@ app.add_middleware(
     allow_headers=["*"],
 )
 # "xenova/mobilebert-uncased-mnli" "typeform/mobilebert-uncased-mnli" Fast but small--same as bundled in Statosphere
 # "xenova/deberta-v3-base-tasksource-nli" Not impressed
 # "Xenova/bart-large-mnli" A bit slow
@@ -29,22 +50,39 @@ tokenizer_name = "cross-encoder/nli-deberta-v3-small"
 model = ORTModelForSequenceClassification.from_pretrained(model_name, file_name=file_name)
 tokenizer = AutoTokenizer.from_pretrained(tokenizer_name, model_max_length=512)
 # file = cached_download("https://huggingface.co/" + model_name + "")
 # sess = InferenceSession(file)
 classifier = pipeline(task="zero-shot-classification", model=model, tokenizer=tokenizer)
-def zero_shot_classification(data_string, request: gradio.Request):
     if request:
         if request.headers["origin"] not in ["https://statosphere-3704059fdd7e.c5v4v4jx6pq5.win", "https://crunchatize-77a78ffcc6a6.c5v4v4jx6pq5.win", "https://ravenok-statosphere-backend.hf.space"]:
             return "{}"
     data = json.loads(data_string)
     results = classifier(data['sequence'], candidate_labels=data['candidate_labels'], hypothesis_template=data['hypothesis_template'], multi_label=data['multi_label'])
     response_string = json.dumps(results)
     return response_string
 gradio_interface = gradio.Interface(
-    fn = zero_shot_classification,
     inputs = gradio.Textbox(label="JSON Input"),
     outputs = gradio.Textbox()
 )

 from optimum.onnxruntime import ORTModelForSequenceClassification
 from fastapi import FastAPI
 from fastapi.middleware.cors import CORSMiddleware
+from setfit import SetFitModel
 # CORS Config
 app = FastAPI()
     allow_headers=["*"],
 )
+class OnnxSetFitModel:
+    def __init__(self, ort_model, tokenizer, model_head):
+        self.ort_model = ort_model
+        self.tokenizer = tokenizer
+        self.model_head = model_head
+    def predict(self, inputs):
+        encoded_inputs = self.tokenizer(
+            inputs, padding=True, truncation=True, return_tensors="pt"
+        ).to(self.ort_model.device)
+        outputs = self.ort_model(**encoded_inputs)
+        embeddings = mean_pooling(
+            outputs["last_hidden_state"], encoded_inputs["attention_mask"]
+        )
+        return self.model_head.predict(embeddings.cpu())
+    def __call__(self, inputs):
+        return self.predict(inputs)
 # "xenova/mobilebert-uncased-mnli" "typeform/mobilebert-uncased-mnli" Fast but small--same as bundled in Statosphere
 # "xenova/deberta-v3-base-tasksource-nli" Not impressed
 # "Xenova/bart-large-mnli" A bit slow
 model = ORTModelForSequenceClassification.from_pretrained(model_name, file_name=file_name)
 tokenizer = AutoTokenizer.from_pretrained(tokenizer_name, model_max_length=512)
+few_shot_model_name = "moshew/bge-small-en-v1.5_setfit-sst2-english"
+few_shot_model = setFitModel.from_pretrained(few_shot_model_name)
+few_shot_tokenizer = AutoTokenizer.from_pretrained('bge_auto_opt_04', model_max_length=512)
+ort_model = ORTModelForFeatureExtraction.from_pretrained('bge_auto_opt_O4')
+onnx_few_shot_model = OnnxSetFitModel(ort_model, tokenizer, model.model_head)
 # file = cached_download("https://huggingface.co/" + model_name + "")
 # sess = InferenceSession(file)
 classifier = pipeline(task="zero-shot-classification", model=model, tokenizer=tokenizer)
+def classify(data_string, request: gradio.Request):
     if request:
         if request.headers["origin"] not in ["https://statosphere-3704059fdd7e.c5v4v4jx6pq5.win", "https://crunchatize-77a78ffcc6a6.c5v4v4jx6pq5.win", "https://ravenok-statosphere-backend.hf.space"]:
             return "{}"
     data = json.loads(data_string)
+    if (data['task'] == 'few_shot_classification')
+        return few_shot_classification
+    else
+        return zero_shot_classification
+def zero_shot_classification(data):
     results = classifier(data['sequence'], candidate_labels=data['candidate_labels'], hypothesis_template=data['hypothesis_template'], multi_label=data['multi_label'])
     response_string = json.dumps(results)
     return response_string
+def few_shot_classification(data):
+    results = onnx_few_shot_model(data['sequence'])
+    response_string = json.dumps(results)
+    return response_string
 gradio_interface = gradio.Interface(
+    fn = classify,
     inputs = gradio.Textbox(label="JSON Input"),
     outputs = gradio.Textbox()
 )

requirements.txt CHANGED Viewed

@@ -2,5 +2,6 @@ fastapi==0.88.0
 json5==0.9.10
 numpy==1.23.4
 optimum[exporters,onnxruntime]==1.21.3
 torch==1.12.1
 torchvision==0.13.1

 json5==0.9.10
 numpy==1.23.4
 optimum[exporters,onnxruntime]==1.21.3
+setfit==1.0.3
 torch==1.12.1
 torchvision==0.13.1