charset = None # ...try charset from HTML
for p in parsers:
- parser = p(filename, charset)
+ charsets = [universal_charset, DEFAULT_CHARSET]
+ if charset not in charsets:
+ charsets.insert(0, charset)
+ parser = None
+ for c in charsets:
+ try:
+ parser = p(filename, c)
+ break
+ except UnicodeEncodeError:
+ pass
if parser:
break
else:
if parser.meta_charset:
if log: log(" META charset : %s" % parser.charset)
else:
- if log: log(" HTTP charset : %s" % parser.charset)
+ if log: log(" guessed charset: %s" % parser.charset)
if log: log(" current charset: %s" % universal_charset)
if log: log(" title : %s" % title)
try: