X-Git-Url: https://git.phdru.name/?a=blobdiff_plain;f=Robots%2Fparse_html_beautifulsoup.py;h=f76f058f2578aabe430c2c403f919dad87c84b9d;hb=f0f6bb16244c97ca07645367b66d2454fcd7cfc3;hp=162e7a37dabd218df12aaf14e50c14e70f778177;hpb=d4d9255c90fb65adf5a8d8d03b55d558b77fe756;p=bookmarks_db.git diff --git a/Robots/parse_html_beautifulsoup.py b/Robots/parse_html_beautifulsoup.py index 162e7a3..f76f058 100644 --- a/Robots/parse_html_beautifulsoup.py +++ b/Robots/parse_html_beautifulsoup.py @@ -77,7 +77,7 @@ def parse_html(filename, charset=None, log=None): head = html # Some sites put TITLE in HTML without HEAD _charset = root.originalEncoding - if _charset == "windows-1252": # Replace default + if _charset in ("ISO-8859-2", "windows-1252"): # Replace default _charset = DEFAULT_CHARSET try: