Update app.py
Browse files
app.py
CHANGED
|
@@ -8,26 +8,34 @@ import datasets
|
|
| 8 |
|
| 9 |
import pandas as pd
|
| 10 |
import nltk
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 11 |
import numpy as np
|
| 12 |
import os
|
| 13 |
import re #regular expressions
|
| 14 |
-
|
|
|
|
| 15 |
from sklearn.feature_extraction.text import CountVectorizer # for bag of words (bow)
|
| 16 |
from sklearn.feature_extraction.text import TfidfVectorizer #for tfidf
|
| 17 |
-
from nltk import pos_tag # for parts of speech
|
| 18 |
from sklearn.metrics import pairwise_distances # cosine similarity
|
| 19 |
-
from
|
| 20 |
-
|
| 21 |
from gensim.models import Word2Vec, KeyedVectors
|
| 22 |
import gensim.downloader as api
|
| 23 |
-
|
| 24 |
import gradio as gr
|
| 25 |
import time
|
| 26 |
-
|
| 27 |
-
|
| 28 |
-
# nltk.download('averaged_perceptron_tagger')
|
| 29 |
-
nltk.download('wordnet')
|
| 30 |
-
nltk.download('stopwords')
|
| 31 |
|
| 32 |
|
| 33 |
# Take Rachel as main character
|
|
|
|
| 8 |
|
| 9 |
import pandas as pd
|
| 10 |
import nltk
|
| 11 |
+
from nltk import word_tokenize
|
| 12 |
+
from nltk.corpus import stopwords
|
| 13 |
+
from nltk.stem import wordnet # for lemmatization
|
| 14 |
+
from nltk import pos_tag # for parts of speech
|
| 15 |
+
nltk.download('omw-1.4') #this is for the .apply() function to work
|
| 16 |
+
nltk.download('punkt')
|
| 17 |
+
nltk.download('averaged_perceptron_tagger')
|
| 18 |
+
nltk.download('wordnet')
|
| 19 |
+
nltk.download('stopwords')
|
| 20 |
+
|
| 21 |
+
|
| 22 |
import numpy as np
|
| 23 |
import os
|
| 24 |
import re #regular expressions
|
| 25 |
+
import time
|
| 26 |
+
|
| 27 |
from sklearn.feature_extraction.text import CountVectorizer # for bag of words (bow)
|
| 28 |
from sklearn.feature_extraction.text import TfidfVectorizer #for tfidf
|
|
|
|
| 29 |
from sklearn.metrics import pairwise_distances # cosine similarity
|
| 30 |
+
from sklearn.metrics.pairwise import cosine_similarity
|
| 31 |
+
|
| 32 |
from gensim.models import Word2Vec, KeyedVectors
|
| 33 |
import gensim.downloader as api
|
| 34 |
+
|
| 35 |
import gradio as gr
|
| 36 |
import time
|
| 37 |
+
|
| 38 |
+
|
|
|
|
|
|
|
|
|
|
| 39 |
|
| 40 |
|
| 41 |
# Take Rachel as main character
|