VarunRavichander committed on
Commit
eb9df21
·
verified ·
1 Parent(s): acfcab4

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +29 -9
app.py CHANGED
@@ -9,15 +9,35 @@ import os
9
  import nltk
10
  import os
11
 
12
- # Set up NLTK data path
13
- NLTK_DATA_PATH = os.path.join(os.getcwd(), 'nltk_data')
14
- os.makedirs(NLTK_DATA_PATH, exist_ok=True)
15
- nltk.data.path.append(NLTK_DATA_PATH)
16
-
17
- # Download all required NLTK resources
18
- resources = ['punkt', 'averaged_perceptron_tagger', 'wordnet', 'omw-1.4']
19
- for resource in resources:
20
-     nltk.download(resource, quiet=True, download_dir=NLTK_DATA_PATH)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
21
 
22
 
23
  def initialize_humanizer():
 
9
  import nltk
10
  import os
11
 
12
+
13
+
14
+
15
+ import nltk
16
+ import os
17
+ from nltk.tokenize.punkt import PunktLanguageVars
18
+
19
+ # Create and set NLTK data directory
20
+ NLTK_DATA = os.path.join(os.getcwd(), 'nltk_data')
21
+ os.makedirs(NLTK_DATA, exist_ok=True)
22
+ nltk.data.path.append(NLTK_DATA)
23
+
24
+ # Download essential resources
25
+ resources = [
26
+ ('punkt', 'tokenizers/punkt'),
27
+ ('averaged_perceptron_tagger', 'taggers/averaged_perceptron_tagger'),
28
+ ('wordnet', 'corpora/wordnet'),
29
+ ]
30
+
31
+ # Download each resource
32
+ for resource, path in resources:
33
+     try:
34
+         nltk.data.find(path)
35
+     except LookupError:
36
+         nltk.download(resource, download_dir=NLTK_DATA)
37
+
38
+ # Initialize PunktLanguageVars
39
+ punkt_vars = PunktLanguageVars()
40
+
41
 
42
 
43
  def initialize_humanizer():