namnh113 committed on
Commit
542dc66
·
1 Parent(s): 570c54b

Update relevance_ranking.py

Browse files
Files changed (1) hide show
  1. relevance_ranking.py +6 -5
relevance_ranking.py CHANGED
@@ -155,7 +155,7 @@ def keyword_extraction(question):
155
  for token in words:
156
  word = token[0]
157
  pos = token[1]
158
- if pos not in stopwords:
159
  keywords += word.lower().split('_')
160
 
161
  keywords = list(set(keywords))
@@ -165,10 +165,11 @@ def keyword_extraction(question):
165
 
166
  def isRelevant(text, keywords):
167
  text = text.lower().replace('_',' ')
168
- for words in keywords:
169
- if not any(e for e in words if e in text):
170
- return False
171
- return True
 
172
 
173
  def removeDuplicate(documents):
174
  mapUnigram = {}
 
155
  for token in words:
156
  word = token[0]
157
  pos = token[1]
158
+ if word not in stopwords:
159
  keywords += word.lower().split('_')
160
 
161
  keywords = list(set(keywords))
 
165
 
166
  def isRelevant(text, keywords):
167
  text = text.lower().replace('_',' ')
168
+ words = list(set([_ for word in keywords for _ in word]))
169
+ for word in words:
170
+ if word in text:
171
+ return True
172
+ return False
173
 
174
  def removeDuplicate(documents):
175
  mapUnigram = {}