X-Git-Url: https://git.phdru.name/?p=bookmarks_db.git;a=blobdiff_plain;f=parse_html%2Fbkmk_parse_html.py;h=af9395b0d8d735689288a02071a0e1aee80814de;hp=fa72e1f2aa14f5296343434895bcf6ccb22e088d;hb=7fc9a9ac1bfa749aa30e3ae1d730ac4f266db950;hpb=be7cec61fa405f38dea2edde623174ca47ca7dc3 diff --git a/parse_html/bkmk_parse_html.py b/parse_html/bkmk_parse_html.py index fa72e1f..af9395b 100644 --- a/parse_html/bkmk_parse_html.py +++ b/parse_html/bkmk_parse_html.py @@ -152,8 +152,15 @@ def parse_html(html_text, charset=None, log=None): try: parser.title = title.encode('ascii') except UnicodeEncodeError: - parser.charset = DEFAULT_CHARSET - parser.title = title.encode(DEFAULT_CHARSET) + try: + parser.title = title.encode(DEFAULT_CHARSET) + except UnicodeEncodeError: + parser.title = title.encode(universal_charset) + parser.charset = universal_charset + else: + parser.charset = DEFAULT_CHARSET + else: + parser.charset = 'ascii' converted_title = title = parser.title if title and (not parser.charset):