git.phdru.name Git - bookmarks_db.git/commitdiff
Fixed parsing in case of unknown entity.
author Oleg Broytman <phd@phdru.name>
Sun, 8 Aug 2010 19:52:35 +0000 (19:52 +0000)
committer Oleg Broytman <phd@phdru.name>
Sun, 8 Aug 2010 19:52:35 +0000 (19:52 +0000)
git-svn-id: file:///home/phd/archive/SVN/bookmarks_db/trunk@243 fdd5c36f-1aea-0310-aeeb-c58d7e2b6c23

Robots/parse_html.py

index 80c7aa89d28efed06db8a598088303f44d2b338b..fd8dc927c0d78d7adcd8394457774450ff9dd403 100755 (executable)
@@ -34,8 +34,12 @@ def recode_entities(title, charset):
    for part in entity_re.split(title):
       if part not in ("&amp;", "&lt;", "&gt;", "&quot;") and \
             entity_re.match(part):
-         part = unichr(name2codepoint.get(part[1:-1], part)).encode(charset)
-      output.append(part)
+         _part = name2codepoint.get(part[1:-1], None)
+         if _part is None:
+             _part = part
+         else:
+             _part = unichr(_part).encode(charset)
+      output.append(_part)
    title = ''.join(output)
 
    output = []