Some sites return empty "html" that consists only of whitespace.
Strip it to get a truly empty string.
if content_type.startswith(ctype):
is_html = True
break
- if content and is_html:
- parser = parse_html(content, charset, self.log)
+ content_stripped = content.strip()
+ if content_stripped and is_html:
+ parser = parse_html(content_stripped, charset, self.log)
if parser:
bookmark.real_title = parser.title
icon = parser.icon
% (url, timeout)
)
- if not content:
+ if not content_stripped:
self.log(" empty response, no content")
if not is_html:
self.log(" not html")