From: Oleg Broytman Date: Tue, 4 Mar 2008 10:14:56 +0000 (+0000) Subject: I have never seen pages in MacCyrillic. X-Git-Tag: v4.5.3~181 X-Git-Url: https://git.phdru.name/?a=commitdiff_plain;h=3f74e8242f3fb1474ed258d97d791018f3bc1a34;p=bookmarks_db.git I have never seen pages in MacCyrillic. git-svn-id: file:///home/phd/archive/SVN/bookmarks_db/trunk@195 fdd5c36f-1aea-0310-aeeb-c58d7e2b6c23 --- diff --git a/Robots/parse_html_beautifulsoup.py b/Robots/parse_html_beautifulsoup.py index f76f058..632ee9f 100644 --- a/Robots/parse_html_beautifulsoup.py +++ b/Robots/parse_html_beautifulsoup.py @@ -77,7 +77,7 @@ def parse_html(filename, charset=None, log=None): head = html # Some sites put TITLE in HTML without HEAD _charset = root.originalEncoding - if _charset in ("ISO-8859-2", "windows-1252"): # Replace default + if _charset in ("ISO-8859-2", "windows-1252", "MacCyrillic"): # Replace default _charset = DEFAULT_CHARSET try: