Spaces:
Sleeping
Sleeping
Update relevance_ranking.py
Browse files
- relevance_ranking.py +6 -5
relevance_ranking.py
CHANGED
@@ -155,7 +155,7 @@ def keyword_extraction(question):
|
|
155 |
for token in words:
|
156 |
word = token[0]
|
157 |
pos = token[1]
|
158 |
-
if
|
159 |
keywords += word.lower().split('_')
|
160 |
|
161 |
keywords = list(set(keywords))
|
@@ -165,10 +165,11 @@ def keyword_extraction(question):
|
|
165 |
|
166 |
def isRelevant(text, keywords):
|
167 |
text = text.lower().replace('_',' ')
|
168 |
-
for
|
169 |
-
|
170 |
-
|
171 |
-
|
|
|
172 |
|
173 |
def removeDuplicate(documents):
|
174 |
mapUnigram = {}
|
|
|
155 |
for token in words:
|
156 |
word = token[0]
|
157 |
pos = token[1]
|
158 |
+
if word not in stopwords:
|
159 |
keywords += word.lower().split('_')
|
160 |
|
161 |
keywords = list(set(keywords))
|
|
|
165 |
|
166 |
def isRelevant(text, keywords):
|
167 |
text = text.lower().replace('_',' ')
|
168 |
+
words = list(set([_ for word in keywords for _ in word]))
|
169 |
+
for word in words:
|
170 |
+
if word in text:
|
171 |
+
return True
|
172 |
+
return False
|
173 |
|
174 |
def removeDuplicate(documents):
|
175 |
mapUnigram = {}
|