1
0
mirror of synced 2024-11-22 01:04:23 +01:00

<title> is also HTML metadata

This commit is contained in:
jvoisin 2019-02-23 20:47:26 +01:00
parent c757a9b7ef
commit 524bae5972

View File

@@ -54,7 +54,7 @@ class _HTMLParser(parser.HTMLParser):
we're using an internal queue to track all the opening/closing tags,
and hoping for the best.
"""
-tag_blacklist = {'doctitle', 'meta'} # everything is lowercase
+tag_blacklist = {'doctitle', 'meta', 'title'} # everything is lowercase
def __init__(self, filename):
super().__init__()
self.filename = filename