X-Git-Url: https://git.phdru.name/?a=blobdiff_plain;f=Robots%2Fparse_html_beautifulsoup.py;h=c8e8f5db54af91c96a439584d09ade66b094de46;hb=5c1c16d3e1a5fdf4ea1ecc6c31f5e4c6a4240bed;hp=e0129fd1d4cb3c7b34f69f8c772946c04afab645;hpb=66ef97e93d66c741926db216c29dad6047c5d7f4;p=bookmarks_db.git diff --git a/Robots/parse_html_beautifulsoup.py b/Robots/parse_html_beautifulsoup.py index e0129fd..c8e8f5d 100644 --- a/Robots/parse_html_beautifulsoup.py +++ b/Robots/parse_html_beautifulsoup.py @@ -23,9 +23,9 @@ def parse_html(filename, charset=None): root = BeautifulSoup(infile, fromEncoding=charset) infile.close() - charset = root.originalEncoding + _charset = root.originalEncoding try: - title = root.html.head.title.string.encode(charset) + title = root.html.head.title.string.encode(_charset) except AttributeError: title = '' @@ -49,8 +49,7 @@ def parse_html(filename, charset=None): else: icon = None - parser = BSoupParser(charset, False, title, refresh, icon) - return parser + return BSoupParser(_charset, _charset == charset, title, refresh, icon) def _find_refresh(Tag): return (Tag.name == "meta") and \