"""
HTML Parser using BeautifulSoup
- Written by BroytMann. Copyright (C) 2007 PhiloSoft Design
+ Written by BroytMann. Copyright (C) 2007, 2008 PhiloSoft Design
"""
import re
except AttributeError:
return None
+ if head is None:
+ head = root.html # Some sites put TITLE in HTML without HEAD
+
_charset = root.originalEncoding
try:
title = head.title.string.encode(_charset)
except AttributeError:
- return '' # HEAD but no TITLE
+ title = '' # HEAD but no TITLE
+
+ if (not title) and (head is not root.html):
+ # Some sites put TITLE in HTML outside of HEAD
+
+ try:
+ title = root.html.title.string.encode(_charset)
+ except AttributeError:
+ title = '' # no TITLE in HTML too
meta = head.find(_find_refresh, recursive=False)
if meta: