]> git.phdru.name Git - bookmarks_db.git/commitdiff
I have never seen pages in MacCyrillic.
author Oleg Broytman <phd@phdru.name>
Tue, 4 Mar 2008 10:14:56 +0000 (10:14 +0000)
committer Oleg Broytman <phd@phdru.name>
Tue, 4 Mar 2008 10:14:56 +0000 (10:14 +0000)
git-svn-id: file:///home/phd/archive/SVN/bookmarks_db/trunk@195 fdd5c36f-1aea-0310-aeeb-c58d7e2b6c23

Robots/parse_html_beautifulsoup.py

index f76f058f2578aabe430c2c403f919dad87c84b9d..632ee9f15cfaafec9a9f14ac8135354af655efac 100644 (file)
@@ -77,7 +77,7 @@ def parse_html(filename, charset=None, log=None):
       head = html # Some sites put TITLE in HTML without HEAD
 
    _charset = root.originalEncoding
-   if _charset in ("ISO-8859-2", "windows-1252"): # Replace default
+   if _charset in ("ISO-8859-2", "windows-1252", "MacCyrillic"): # Replace default
       _charset = DEFAULT_CHARSET
 
    try: