Spaces:

ebhon
/

text-classification-nlp

Build error

ebhon committed on Nov 4, 2024

Commit

b677cf4

verified ·

1 Parent(s): d51ea80

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -15,20 +15,26 @@ from sklearn.feature_extraction.text import CountVectorizer
 nltk_data_path = '/home/user/nltk_data'
 if not os.path.exists(nltk_data_path):
     os.makedirs(nltk_data_path)
 nltk.data.path.append(nltk_data_path)
-if not os.path.exists(os.path.join(nltk_data_path, "tokenizers/punkt")):
-    nltk.download('punkt', download_dir=nltk_data_path)
-if not os.path.exists(os.path.join(nltk_data_path, "corpora/stopwords")):
-    nltk.download('stopwords', download_dir=nltk_data_path)
 from nltk.corpus import stopwords
 from nltk.tokenize import sent_tokenize
 stop_words = set(stopwords.words('english'))
 model = load_model('model_improved.keras')
 vectorizer = joblib.load('vectorizer.joblib')

 nltk_data_path = '/home/user/nltk_data'
 if not os.path.exists(nltk_data_path):
     os.makedirs(nltk_data_path)
 nltk.data.path.append(nltk_data_path)
+nltk.download('punkt', download_dir=nltk_data_path)
+nltk.download('stopwords', download_dir=nltk_data_path)
 from nltk.corpus import stopwords
 from nltk.tokenize import sent_tokenize
 stop_words = set(stopwords.words('english'))
+sample_text = "This is a test sentence. Let's see if it works!"
+sentences = sent_tokenize(sample_text)
+print(sentences)
 model = load_model('model_improved.keras')
 vectorizer = joblib.load('vectorizer.joblib')