Spaces:

davidepanza
/

test2text

Sleeping

davidepanza committed on Jun 19, 2025

Commit

ec294c1

verified ·

1 Parent(s): 79fcbeb

Update app/backend/text_processing.py

Files changed (1) hide show

app/backend/text_processing.py CHANGED Viewed

@@ -6,7 +6,7 @@ import re
 def sent_tokenize(text):
-    """Simple sentence tokenizer using regex - no NLTK needed"""
     # Split on sentence endings followed by whitespace and capital letter
     sentences = re.split(r'(?<=[.!?])\s+(?=[A-Z])', text)

 def sent_tokenize(text):
+    """Simple sentence tokenizer using regex (simpler alternative to NLTK)"""
     # Split on sentence endings followed by whitespace and capital letter
     sentences = re.split(r'(?<=[.!?])\s+(?=[A-Z])', text)