X-Git-Url: https://git.phdru.name/?a=blobdiff_plain;f=bkmk_parser.py;h=90b33b37a711a415e2611776f3646ae721318250;hb=1e2f258f40c74803df6746e7b6041776ba715f4b;hp=e3b3db02532567aef8060c4546f1f3a6af6039e2;hpb=c9cfb54ef36e77aee7187e4533f063d407073ad8;p=bookmarks_db.git diff --git a/bkmk_parser.py b/bkmk_parser.py index e3b3db0..90b33b3 100644 --- a/bkmk_parser.py +++ b/bkmk_parser.py @@ -15,7 +15,7 @@ __all__ = ['BkmkParser'] import sys, os from m_lib.net.www.html import HTMLParser -from bkmk_objects import Folder, Bookmark, Ruler +from bkmk_objects import DEFAULT_CHARSET, Folder, Bookmark, Ruler DEBUG = os.environ.has_key("BKMK_DEBUG") @@ -37,8 +37,6 @@ else: dump_names = debug -DEFAULT_CHARSET = None - class BkmkParser(HTMLParser): def __init__(self): HTMLParser.__init__(self) @@ -46,12 +44,12 @@ class BkmkParser(HTMLParser): self.urls = 0 self.objects = 0 - self.charset = "" + self.charset = None self.recode = None def handle_data(self, data): if data: - if DEFAULT_CHARSET: + if self.charset and DEFAULT_CHARSET: data = unicode(data, self.charset, "replace").encode(DEFAULT_CHARSET, "xmlcharrefreplace") self.accumulator += data @@ -73,16 +71,6 @@ class BkmkParser(HTMLParser): self.charset = content.split('=')[1] except IndexError: pass - else: - global DEFAULT_CHARSET - DEFAULT_CHARSET = sys.getdefaultencoding() - if DEFAULT_CHARSET == "ascii": - try: - import locale - except ImportError: - pass - else: - DEFAULT_CHARSET = locale.getpreferredencoding() def start_title(self, attrs): if DEFAULT_CHARSET: