space_20

Sleeping

Frenchizer committed on Feb 15, 2025

Commit

a3aabf5

verified ·

1 Parent(s): 7821050

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -39,34 +39,31 @@ def preprocess_text(text: str):
     if capitalized_text != text:
         result["spell_suggestions"].append({
             "original": text,
-            "corrected": capitalized_text,
-            "source": "capitalization"  # Track the source of the correction
         })
         text = capitalized_text  # Update text for further processing
-    # TextBlob spell check
     blob = TextBlob(text)
     corrected = str(blob.correct())
     if corrected != text:
-        print(f"TextBlob suggestion: {text} → {corrected}")  # Debugging
         result["spell_suggestions"].append({
             "original": text,
-            "corrected": corrected,
-            "source": "TextBlob"  # Track the source of the correction
         })
     # Transformer spell check
     spell_checked = spell_checker(text, max_length=512)[0]['generated_text']
     if spell_checked != text and spell_checked != corrected:
-        print(f"Transformer suggestion: {text} → {spell_checked}")  # Debugging
         result["spell_suggestions"].append({
             "original": text,
-            "corrected": spell_checked,
-            "source": "Transformer"  # Track the source of the correction
         })
     # Add entities and tags
-    doc = nlp(text)
     result["entities"] = [{"text": ent.text, "label": ent.label_} for ent in doc.ents]
     result["tags"] = [token.text for token in doc if token.text.startswith(('#', '@'))]

     if capitalized_text != text:
         result["spell_suggestions"].append({
             "original": text,
+            "corrected": capitalized_text
         })
         text = capitalized_text  # Update text for further processing
+    # Find and record positions of corrections
+    doc = nlp(text)
+    # TextBlob spell check with position tracking
     blob = TextBlob(text)
     corrected = str(blob.correct())
     if corrected != text:
         result["spell_suggestions"].append({
             "original": text,
+            "corrected": corrected
         })
     # Transformer spell check
     spell_checked = spell_checker(text, max_length=512)[0]['generated_text']
     if spell_checked != text and spell_checked != corrected:
         result["spell_suggestions"].append({
             "original": text,
+            "corrected": spell_checked
         })
     # Add entities and tags
     result["entities"] = [{"text": ent.text, "label": ent.label_} for ent in doc.ents]
     result["tags"] = [token.text for token in doc if token.text.startswith(('#', '@'))]