ignore excluded words completely
This commit is contained in:
parent
987da2aa95
commit
43ff74265c
1 changed file with 1 addition and 1 deletion
|
@@ -43,7 +43,7 @@ class FileScanner(HTMLParser):
|
|||
word = tag_name.lower()
|
||||
score = 10
|
||||
if word in EXCLUDED_WORDS:
|
||||
- score = 0
|
||||
+ continue
|
||||
if word in title_words:
|
||||
score *= 4
|
||||
if len(word) <= 3:
|
||||
|
|
Loading…
Reference in a new issue