return None
_charset = root.originalEncoding
- if _charset in ("ISO-8859-2", "windows-1252", "MacCyrillic"): # Replace default
+ if _charset in ("ISO-8859-2", "windows-1252", "MacCyrillic"):
+ # Replace with default and re-parse
_charset = DEFAULT_CHARSET
root = _parse_html(html_text, _charset)
if root is None:
try:
meta_content = meta.get("content")
if meta_content:
- __charset = meta_content.lower().split('charset=')[1].split(';')[0]
+ __charset = meta_content.lower().split('charset=')[1].\
+ split(';')[0]
else:
__charset = False
except IndexError: # No charset in the META Content-Type