Spaces:

sentimentanalyzer01
/

sentiment_analyzer

Runtime error

App Files Files Community

sentimentanalyzer01 committed on Mar 21

Commit

cd60e73

verified ·

1 Parent(s): 42b797d

Update app.py

Browse files

Files changed (1) hide show

app.py +76 -13

app.py CHANGED Viewed

@@ -41,7 +41,7 @@ def clean_russian_text(text):
     return text
 # ============================================================
-# ПОЛНЫЙ КЛАСС ОНТОЛОГИИ
 # ============================================================
 class OntologyEmotionModel:
@@ -139,12 +139,42 @@ class OntologyEmotionModel:
     def init_ontology_level2(self):
         self.linguistic_rules = {
-            'усилители': {'words': ['очень', 'сильно', 'крайне', 'чрезвычайно', 'невероятно', 'абсолютно'], 'effect': 'increase_arousal', 'weight': 0.3, 'learnable': True},
-            'ослабители': {'words': ['слегка', 'немного', 'чуть-чуть', 'отчасти', 'несколько'], 'effect': 'decrease_arousal', 'weight': -0.2, 'learnable': True},
-            'отрицания': {'words': ['не', 'ни', 'нет', 'нельзя', 'невозможно'], 'effect': 'negation', 'weight': -0.5, 'learnable': True},
-            'восклицания': {'patterns': [r'!+', r'\?+', r'\.{3,}'], 'effect': 'increase_arousal', 'weight': 0.4, 'learnable': True},
-            'вопросительные': {'patterns': [r'\?+'], 'effect': 'uncertainty', 'weight': 0.2, 'learnable': True},
-            'сарказм_маркеры': {'words': ['какой', 'такой', 'прям', 'ага', 'ну да'], 'effect': 'sarcasm', 'weight': 0.3, 'learnable': True}
         }
     def add_empirical_knowledge(self, text: str, emotion: str, confidence: float):
@@ -194,7 +224,8 @@ class OntologyEmotionModel:
                 for word in rule['words']:
                     if word in lemmas:
                         rules_applied.append(f"{category}: {word}")
-                        effect = rule['effect']; weight = rule['weight']
                         if effect == 'increase_arousal':
                             adjustments['arousal'] += weight
                         elif effect == 'decrease_arousal':
@@ -238,6 +269,16 @@ class OntologyEmotionModel:
             adjustments['sarcasm'] += 0.5
             rules_applied.append(f"контраст тональности: позитив {pos_words[:2]} vs негатив {neg_words[:2]}")
         return {'rules_applied': rules_applied, 'adjustments': adjustments, 'lemmas': lemmas}
     def calculate_disagreement(self, pred1: Dict, pred2: Dict) -> float:
@@ -266,24 +307,39 @@ class OntologyEmotionModel:
         conf_mult = 1.0 + adj['arousal'] * 0.2 + adj['uncertainty'] * 0.1 - abs(adj['valence']) * 0.1
         conf_mult = np.clip(conf_mult, 0.5, 1.5)
         new_confidence = original_confidence * conf_mult
         new_emotion = original_emotion
         for rule in rules:
             if rule.startswith("инверсия негатива:"):
                 new_emotion = 'радость'
                 break
             elif rule.startswith("инверсия позитива:"):
-                new_emotion = 'грусть' if adj['arousal'] <= 0.3 else 'злость'
                 break
-        if adj['sarcasm'] > 0.5 and original_emotion == 'радость':
             new_emotion = 'сарказм'
-            new_confidence *= 0.8
         if any('восклицание' in r for r in rules):
             new_confidence = min(new_confidence * 1.2, 1.0)
-        return {'emotion': new_emotion, 'confidence': new_confidence, 'rules_applied': rules}
     def get_ontology_analysis(self, text: str, model_prediction: Dict) -> Dict:
         rule_analysis = self.apply_linguistic_rules(text)
@@ -352,6 +408,10 @@ class EmotionBERT(nn.Module):
             return logits, conf
         return logits
 class CascadeEmotionClassifier:
     def __init__(self, lstm_model, bert_model, vocab, tokenizer, label_encoder, ontology_model, threshold=0.95, device='cpu', max_length_lstm=100, max_length_bert=128):
         self.lstm_model = lstm_model
@@ -532,6 +592,8 @@ async def predict(text: str = Form(...)):
         return JSONResponse({"error": "Введите хотя бы 3 символа."}, status_code=400)
     try:
         result = classifier.predict(text)
         rules_display = []
         for rule in result['rules_applied'][:10]:
             if ':' in rule:
@@ -539,13 +601,14 @@ async def predict(text: str = Form(...)):
                 rules_display.append(f"<span class='rule-tag'>{cat}: {val}</span>")
             else:
                 rules_display.append(f"<span class='rule-tag'>{rule}</span>")
         return JSONResponse({
             "success": True,
             "emotion": result['predicted_emotion'],
             "confidence": f"{result['confidence']*100:.1f}%",
             "used_model": result['used_model'],
             "rules": "".join(rules_display) if rules_display else "Нет правил",
-            "was_corrected": result['was_corrected_by_ontology']
         })
     except Exception as e:
         return JSONResponse({"error": str(e)}, status_code=500)

     return text
 # ============================================================
+# ПОЛНЫЙ КЛАСС ОНТОЛОГИИ (исправленный)
 # ============================================================
 class OntologyEmotionModel:
     def init_ontology_level2(self):
         self.linguistic_rules = {
+            'усилители': {
+                'words': ['очень', 'сильно', 'крайне', 'чрезвычайно', 'невероятно', 'абсолютно'],
+                'effect': 'increase_arousal',
+                'weight': 0.3,
+                'learnable': True
+            },
+            'ослабители': {
+                'words': ['слегка', 'немного', 'чуть-чуть', 'отчасти', 'несколько'],
+                'effect': 'decrease_arousal',
+                'weight': -0.2,
+                'learnable': True
+            },
+            'отрицания': {
+                'words': ['не', 'ни', 'нет', 'нельзя', 'невозможно'],
+                'effect': 'negation',
+                'weight': -0.5,
+                'learnable': True
+            },
+            'восклицания': {
+                'patterns': [r'!+', r'\?+'],
+                'effect': 'increase_arousal',
+                'weight': 0.4,
+                'learnable': True
+            },
+            'вопросительные': {
+                'patterns': [r'\?+'],
+                'effect': 'uncertainty',
+                'weight': 0.2,
+                'learnable': True
+            },
+            'сарказм_маркеры': {
+                'words': ['какой', 'такой', 'прям', 'ага', 'ну да', 'конечно', 'отличная работа', 'прекрасно', 'замечательно', 'как всегда'],
+                'effect': 'sarcasm',
+                'weight': 0.6,
+                'learnable': True
+            }
         }
     def add_empirical_knowledge(self, text: str, emotion: str, confidence: float):
                 for word in rule['words']:
                     if word in lemmas:
                         rules_applied.append(f"{category}: {word}")
+                        effect = rule['effect']
+                        weight = rule['weight']
                         if effect == 'increase_arousal':
                             adjustments['arousal'] += weight
                         elif effect == 'decrease_arousal':
             adjustments['sarcasm'] += 0.5
             rules_applied.append(f"контраст тональности: позитив {pos_words[:2]} vs негатив {neg_words[:2]}")
+        # Дополнительная проверка на саркастические фразы
+        sarcasm_phrases = ['конечно', 'ага', 'ну да', 'как всегда', 'отличная работа', 'прекрасно', 'замечательно']
+        for phrase in sarcasm_phrases:
+            if phrase in text.lower():
+                adjustments['sarcasm'] += 0.6
+                rules_applied.append(f"саркастическая фраза: {phrase}")
+        if adjustments['sarcasm'] > 0.5:
+            rules_applied.append("обнаружен сарказм")
         return {'rules_applied': rules_applied, 'adjustments': adjustments, 'lemmas': lemmas}
     def calculate_disagreement(self, pred1: Dict, pred2: Dict) -> float:
         conf_mult = 1.0 + adj['arousal'] * 0.2 + adj['uncertainty'] * 0.1 - abs(adj['valence']) * 0.1
         conf_mult = np.clip(conf_mult, 0.5, 1.5)
         new_confidence = original_confidence * conf_mult
+        # Ограничиваем максимум 1.0 (100%)
+        new_confidence = min(new_confidence, 1.0)
         new_emotion = original_emotion
+        # Инверсия на основе правил
         for rule in rules:
             if rule.startswith("инверсия негатива:"):
                 new_emotion = 'радость'
                 break
             elif rule.startswith("инверсия позитива:"):
+                if adj['arousal'] > 0.3:
+                    new_emotion = 'злость'
+                else:
+                    new_emotion = 'грусть'
                 break
+        # Сарказм (контраст + маркеры)
+        sarcasm_flag = adj['sarcasm'] > 0.5
+        if sarcasm_flag:
             new_emotion = 'сарказм'
+            new_confidence = min(new_confidence * 0.8, 0.9)
+            if "саркастическая фраза" in str(rules):
+                new_confidence = min(new_confidence * 1.1, 0.95)
+        # Восклицания
         if any('восклицание' in r for r in rules):
             new_confidence = min(new_confidence * 1.2, 1.0)
+        return {
+            'emotion': new_emotion,
+            'confidence': new_confidence,
+            'rules_applied': rules
+        }
     def get_ontology_analysis(self, text: str, model_prediction: Dict) -> Dict:
         rule_analysis = self.apply_linguistic_rules(text)
             return logits, conf
         return logits
+# ============================================================
+# КАСКАДНЫЙ КЛАССИФИКАТОР (исправленный)
+# ============================================================
 class CascadeEmotionClassifier:
     def __init__(self, lstm_model, bert_model, vocab, tokenizer, label_encoder, ontology_model, threshold=0.95, device='cpu', max_length_lstm=100, max_length_bert=128):
         self.lstm_model = lstm_model
         return JSONResponse({"error": "Введите хотя бы 3 символа."}, status_code=400)
     try:
         result = classifier.predict(text)
+        # Форматируем правила для отображения
         rules_display = []
         for rule in result['rules_applied'][:10]:
             if ':' in rule:
                 rules_display.append(f"<span class='rule-tag'>{cat}: {val}</span>")
             else:
                 rules_display.append(f"<span class='rule-tag'>{rule}</span>")
         return JSONResponse({
             "success": True,
             "emotion": result['predicted_emotion'],
             "confidence": f"{result['confidence']*100:.1f}%",
             "used_model": result['used_model'],
             "rules": "".join(rules_display) if rules_display else "Нет правил",
+            "was_corrected": str(result['was_corrected_by_ontology'])
         })
     except Exception as e:
         return JSONResponse({"error": str(e)}, status_code=500)