ebhon committed on
Commit
b677cf4
·
verified ·
1 Parent(s): d51ea80

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +10 -4
app.py CHANGED
@@ -15,20 +15,26 @@ from sklearn.feature_extraction.text import CountVectorizer
15
 
16
  nltk_data_path = '/home/user/nltk_data'
17
 
 
18
  if not os.path.exists(nltk_data_path):
19
  os.makedirs(nltk_data_path)
20
 
 
21
  nltk.data.path.append(nltk_data_path)
22
- if not os.path.exists(os.path.join(nltk_data_path, "tokenizers/punkt")):
23
- nltk.download('punkt', download_dir=nltk_data_path)
24
- if not os.path.exists(os.path.join(nltk_data_path, "corpora/stopwords")):
25
- nltk.download('stopwords', download_dir=nltk_data_path)
26
 
27
  from nltk.corpus import stopwords
28
  from nltk.tokenize import sent_tokenize
29
 
 
30
  stop_words = set(stopwords.words('english'))
31
 
 
 
 
 
32
 
33
  model = load_model('model_improved.keras')
34
  vectorizer = joblib.load('vectorizer.joblib')
 
15
 
16
  nltk_data_path = '/home/user/nltk_data'
17
 
18
+
19
  if not os.path.exists(nltk_data_path):
20
  os.makedirs(nltk_data_path)
21
 
22
+
23
  nltk.data.path.append(nltk_data_path)
24
+ nltk.download('punkt', download_dir=nltk_data_path)
25
+ nltk.download('stopwords', download_dir=nltk_data_path)
26
+
 
27
 
28
  from nltk.corpus import stopwords
29
  from nltk.tokenize import sent_tokenize
30
 
31
+
32
  stop_words = set(stopwords.words('english'))
33
 
34
+
35
+ sample_text = "This is a test sentence. Let's see if it works!"
36
+ sentences = sent_tokenize(sample_text)
37
+ print(sentences)
38
 
39
  model = load_model('model_improved.keras')
40
  vectorizer = joblib.load('vectorizer.joblib')