don't include links anymore
This commit is contained in:
parent
43ff74265c
commit
fba3f789bb
|
@ -56,14 +56,6 @@ class FileScanner(HTMLParser):
|
||||||
words_with_usage[word].score += score
|
words_with_usage[word].score += score
|
||||||
return sorted(words_with_usage.values(), key=lambda tag: tag.score, reverse=True)
|
return sorted(words_with_usage.values(), key=lambda tag: tag.score, reverse=True)
|
||||||
|
|
||||||
def handle_starttag(self, tag, attrs):
|
|
||||||
if tag != "a":
|
|
||||||
return
|
|
||||||
for attr_name, attr_value in attrs:
|
|
||||||
if attr_name == "href":
|
|
||||||
self.texte.append(attr_value)
|
|
||||||
break
|
|
||||||
|
|
||||||
def handle_data(self, data):
|
def handle_data(self, data):
|
||||||
self.texte.append(data)
|
self.texte.append(data)
|
||||||
|
|
||||||
|
|
Loading…
Reference in a new issue