Spaces:
Sleeping
Sleeping
Update relevance_ranking.py
Browse files- relevance_ranking.py +6 -5
relevance_ranking.py
CHANGED
|
@@ -155,7 +155,7 @@ def keyword_extraction(question):
|
|
| 155 |
for token in words:
|
| 156 |
word = token[0]
|
| 157 |
pos = token[1]
|
| 158 |
-
if
|
| 159 |
keywords += word.lower().split('_')
|
| 160 |
|
| 161 |
keywords = list(set(keywords))
|
|
@@ -165,10 +165,11 @@ def keyword_extraction(question):
|
|
| 165 |
|
| 166 |
def isRelevant(text, keywords):
|
| 167 |
text = text.lower().replace('_',' ')
|
| 168 |
-
for
|
| 169 |
-
|
| 170 |
-
|
| 171 |
-
|
|
|
|
| 172 |
|
| 173 |
def removeDuplicate(documents):
|
| 174 |
mapUnigram = {}
|
|
|
|
| 155 |
for token in words:
|
| 156 |
word = token[0]
|
| 157 |
pos = token[1]
|
| 158 |
+
if word not in stopwords:
|
| 159 |
keywords += word.lower().split('_')
|
| 160 |
|
| 161 |
keywords = list(set(keywords))
|
|
|
|
| 165 |
|
| 166 |
def isRelevant(text, keywords):
    """Return True if at least one keyword occurs as a substring of ``text``.

    ``text`` is lower-cased and its underscores are replaced with spaces
    before matching. Keywords are compared exactly as given (they are not
    normalised here).

    Args:
        text: The passage to test.
        keywords: Either a flat iterable of keyword strings, or an iterable
            of keyword groups (lists/tuples/sets of strings). Both shapes
            may be mixed.

    Returns:
        True when any non-empty keyword is contained in the normalised
        text, otherwise False.
    """
    text = text.lower().replace('_', ' ')

    terms = set()
    for entry in keywords:
        if isinstance(entry, str):
            # A plain string is one keyword. Iterating it would break it
            # into single characters and match almost any text.
            terms.add(entry)
        else:
            # A group of keywords: flatten it into the candidate set.
            terms.update(entry)

    # The empty string is a substring of every text, so it carries no
    # relevance signal; splitting on '_' can produce such empty pieces.
    terms.discard('')

    return any(term in text for term in terms)
|
| 173 |
|
| 174 |
def removeDuplicate(documents):
|
| 175 |
mapUnigram = {}
|