Pedrinho-Dev01 committed on
Commit
c7d60e2
·
1 Parent(s): a1de573

API DeBERTa Update

Browse files
Files changed (1) hide show
  1. api.py +24 -7
api.py CHANGED
@@ -1,6 +1,7 @@
1
  """
2
  Spam Detection + Emotion Analysis API
3
- Ensemble of RoBERTa-Large + ELECTRA-Large classifiers.
 
4
  Run with: uvicorn api:app --reload
5
  """
6
 
@@ -15,6 +16,7 @@ from fastapi.middleware.cors import CORSMiddleware
15
  from pydantic import BaseModel
16
  from transformers import (
17
  AutoTokenizer,
 
18
  ElectraForSequenceClassification,
19
  RobertaForSequenceClassification,
20
  )
@@ -25,6 +27,7 @@ ROBERTA_SPAM_REPO = "Dpedrinho01/trained_roberta_large"
25
  ELECTRA_SPAM_REPO = "Dpedrinho01/trained_electra_large"
26
  ROBERTA_EMOTION_REPO = "Dpedrinho01/trained_roberta_emotion"
27
  ELECTRA_EMOTION_REPO = "Dpedrinho01/trained_electra_emotion"
 
28
 
29
  DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
30
 
@@ -124,17 +127,19 @@ roberta_spam_bundle: Optional[SpamModelBundle] = None
124
  electra_spam_bundle: Optional[SpamModelBundle] = None
125
  roberta_emotion_bundle: Optional[EmotionModelBundle] = None
126
  electra_emotion_bundle: Optional[EmotionModelBundle] = None
 
127
 
128
 
129
  @app.on_event("startup")
130
  def load_models():
131
  global roberta_spam_bundle, electra_spam_bundle
132
- global roberta_emotion_bundle, electra_emotion_bundle
133
 
134
  roberta_spam_bundle = SpamModelBundle(ROBERTA_SPAM_REPO, RobertaForSequenceClassification)
135
  electra_spam_bundle = SpamModelBundle(ELECTRA_SPAM_REPO, ElectraForSequenceClassification)
136
  roberta_emotion_bundle = EmotionModelBundle(ROBERTA_EMOTION_REPO, RobertaForSequenceClassification)
137
  electra_emotion_bundle = EmotionModelBundle(ELECTRA_EMOTION_REPO, ElectraForSequenceClassification)
 
138
  print(f"All models ready on {DEVICE}.")
139
 
140
 
@@ -179,6 +184,7 @@ class EmotionPredictResponse(BaseModel):
179
  all_scores: list[EmotionScore] # ensemble averaged, sorted by probability
180
  roberta: Optional[EmotionModelResult] = None
181
  electra: Optional[EmotionModelResult] = None
 
182
 
183
 
184
  class EmlRequest(BaseModel):
@@ -201,15 +207,17 @@ def classify_spam(proba: float, threshold: float) -> dict:
201
  def ensemble_emotions(
202
  roberta_probas: dict[str, float],
203
  electra_probas: dict[str, float],
 
204
  threshold_per_class: dict[str, float],
205
  ) -> tuple[list[str], list[EmotionScore]]:
206
- """Average both models' probabilities and apply per-class thresholds."""
207
  all_scores: list[EmotionScore] = []
208
  detected: list[str] = []
209
 
210
  for emotion, r_prob in roberta_probas.items():
211
  e_prob = electra_probas.get(emotion, 0.0)
212
- avg_prob = round((r_prob + e_prob) / 2, 4)
 
213
  threshold = threshold_per_class.get(emotion, 0.4)
214
  is_detected = avg_prob >= threshold
215
  all_scores.append(EmotionScore(
@@ -285,7 +293,11 @@ def health():
285
  "status": "healthy",
286
  "device": DEVICE,
287
  "spam_models_loaded": roberta_spam_bundle is not None and electra_spam_bundle is not None,
288
- "emotion_models_loaded": roberta_emotion_bundle is not None and electra_emotion_bundle is not None,
 
 
 
 
289
  }
290
 
291
 
@@ -344,10 +356,14 @@ def predict_emotion(req: EmotionPredictRequest):
344
 
345
  roberta_probas = roberta_emotion_bundle.predict_proba(req.text)
346
  electra_probas = electra_emotion_bundle.predict_proba(req.text)
 
347
 
348
- # Use roberta's per-class thresholds (both models share the same config structure)
349
  detected, all_scores = ensemble_emotions(
350
- roberta_probas, electra_probas, roberta_emotion_bundle.threshold_per_class
 
 
 
351
  )
352
 
353
  return EmotionPredictResponse(
@@ -356,6 +372,7 @@ def predict_emotion(req: EmotionPredictRequest):
356
  all_scores=all_scores,
357
  roberta=_emotion_model_result(roberta_emotion_bundle, roberta_probas),
358
  electra=_emotion_model_result(electra_emotion_bundle, electra_probas),
 
359
  )
360
 
361
 
 
1
  """
2
  Spam Detection + Emotion Analysis API
3
+ Ensemble of RoBERTa-Large + ELECTRA-Large classifiers for spam,
4
+ and RoBERTa-Large + ELECTRA-Large + DeBERTa-v3-Large for emotion.
5
  Run with: uvicorn api:app --reload
6
  """
7
 
 
16
  from pydantic import BaseModel
17
  from transformers import (
18
  AutoTokenizer,
19
+ DebertaV2ForSequenceClassification,
20
  ElectraForSequenceClassification,
21
  RobertaForSequenceClassification,
22
  )
 
27
  ELECTRA_SPAM_REPO = "Dpedrinho01/trained_electra_large"
28
  ROBERTA_EMOTION_REPO = "Dpedrinho01/trained_roberta_emotion"
29
  ELECTRA_EMOTION_REPO = "Dpedrinho01/trained_electra_emotion"
30
+ DEBERTA_EMOTION_REPO = "Dpedrinho01/trained_deberta_v3_large_emotion"
31
 
32
  DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
33
 
 
127
  electra_spam_bundle: Optional[SpamModelBundle] = None
128
  roberta_emotion_bundle: Optional[EmotionModelBundle] = None
129
  electra_emotion_bundle: Optional[EmotionModelBundle] = None
130
+ deberta_emotion_bundle: Optional[EmotionModelBundle] = None
131
 
132
 
133
  @app.on_event("startup")
134
  def load_models():
135
  global roberta_spam_bundle, electra_spam_bundle
136
+ global roberta_emotion_bundle, electra_emotion_bundle, deberta_emotion_bundle
137
 
138
  roberta_spam_bundle = SpamModelBundle(ROBERTA_SPAM_REPO, RobertaForSequenceClassification)
139
  electra_spam_bundle = SpamModelBundle(ELECTRA_SPAM_REPO, ElectraForSequenceClassification)
140
  roberta_emotion_bundle = EmotionModelBundle(ROBERTA_EMOTION_REPO, RobertaForSequenceClassification)
141
  electra_emotion_bundle = EmotionModelBundle(ELECTRA_EMOTION_REPO, ElectraForSequenceClassification)
142
+ deberta_emotion_bundle = EmotionModelBundle(DEBERTA_EMOTION_REPO, DebertaV2ForSequenceClassification)
143
  print(f"All models ready on {DEVICE}.")
144
 
145
 
 
184
  all_scores: list[EmotionScore] # ensemble averaged, sorted by probability
185
  roberta: Optional[EmotionModelResult] = None
186
  electra: Optional[EmotionModelResult] = None
187
+ deberta: Optional[EmotionModelResult] = None
188
 
189
 
190
  class EmlRequest(BaseModel):
 
207
  def ensemble_emotions(
208
  roberta_probas: dict[str, float],
209
  electra_probas: dict[str, float],
210
+ deberta_probas: dict[str, float],
211
  threshold_per_class: dict[str, float],
212
  ) -> tuple[list[str], list[EmotionScore]]:
213
+ """Average all three models' probabilities and apply per-class thresholds."""
214
  all_scores: list[EmotionScore] = []
215
  detected: list[str] = []
216
 
217
  for emotion, r_prob in roberta_probas.items():
218
  e_prob = electra_probas.get(emotion, 0.0)
219
+ d_prob = deberta_probas.get(emotion, 0.0)
220
+ avg_prob = round((r_prob + e_prob + d_prob) / 3, 4)
221
  threshold = threshold_per_class.get(emotion, 0.4)
222
  is_detected = avg_prob >= threshold
223
  all_scores.append(EmotionScore(
 
293
  "status": "healthy",
294
  "device": DEVICE,
295
  "spam_models_loaded": roberta_spam_bundle is not None and electra_spam_bundle is not None,
296
+ "emotion_models_loaded": (
297
+ roberta_emotion_bundle is not None
298
+ and electra_emotion_bundle is not None
299
+ and deberta_emotion_bundle is not None
300
+ ),
301
  }
302
 
303
 
 
356
 
357
  roberta_probas = roberta_emotion_bundle.predict_proba(req.text)
358
  electra_probas = electra_emotion_bundle.predict_proba(req.text)
359
+ deberta_probas = deberta_emotion_bundle.predict_proba(req.text)
360
 
361
+ # Use roberta's per-class thresholds (all models share the same config structure)
362
  detected, all_scores = ensemble_emotions(
363
+ roberta_probas,
364
+ electra_probas,
365
+ deberta_probas,
366
+ roberta_emotion_bundle.threshold_per_class,
367
  )
368
 
369
  return EmotionPredictResponse(
 
372
  all_scores=all_scores,
373
  roberta=_emotion_model_result(roberta_emotion_bundle, roberta_probas),
374
  electra=_emotion_model_result(electra_emotion_bundle, electra_probas),
375
+ deberta=_emotion_model_result(deberta_emotion_bundle, deberta_probas),
376
  )
377
 
378