ignore excluded words completely
This commit is contained in:
parent
987da2aa95
commit
43ff74265c
|
@@ -43,7 +43,7 @@ class FileScanner(HTMLParser):
|
||||||
word = tag_name.lower()
|
word = tag_name.lower()
|
||||||
score = 10
|
score = 10
|
||||||
if word in EXCLUDED_WORDS:
|
if word in EXCLUDED_WORDS:
|
||||||
score = 0
|
continue
|
||||||
if word in title_words:
|
if word in title_words:
|
||||||
score *= 4
|
score *= 4
|
||||||
if len(word) <= 3:
|
if len(word) <= 3:
|
||||||
|
|
Loading…
Reference in a new issue