1
0
mirror of synced 2024-11-25 18:54:22 +01:00

<title> is also an html metadata

This commit is contained in:
jvoisin 2019-02-23 20:47:26 +01:00
parent c757a9b7ef
commit 524bae5972

View File

@@ -54,7 +54,7 @@ class _HTMLParser(parser.HTMLParser):
we're using an internal queue to track all the opening/closing tags, we're using an internal queue to track all the opening/closing tags,
and hoping for the best. and hoping for the best.
""" """
tag_blacklist = {'doctitle', 'meta'} # everything is lowercase tag_blacklist = {'doctitle', 'meta', 'title'} # everything is lowercase
def __init__(self, filename): def __init__(self, filename):
super().__init__() super().__init__()
self.filename = filename self.filename = filename