From 3a680d85d6797a14cfed5e6df1d7b75ef1a516ee Mon Sep 17 00:00:00 2001 From: Oleg Broytman Date: Mon, 25 Feb 2008 02:44:02 +0000 Subject: [PATCH] &nbsp; is an entity that needs to be encoded. git-svn-id: file:///home/phd/archive/SVN/bookmarks_db/trunk@185 fdd5c36f-1aea-0310-aeeb-c58d7e2b6c23 --- Robots/parse_html.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/Robots/parse_html.py b/Robots/parse_html.py index 680ad55..038cfaf 100755 --- a/Robots/parse_html.py +++ b/Robots/parse_html.py @@ -32,7 +32,7 @@ num_entity_re = re.compile("(&#[0-9]+;)") def recode_entities(title, charset): output = [] for part in entity_re.split(title): - if part not in ("&amp;", "&lt;", "&gt;", "&quote;", "&nbsp;") and \ + if part not in ("&amp;", "&lt;", "&gt;", "&quote;") and \ entity_re.match(part): part = unichr(name2codepoint.get(part[1:-1], part)).encode(charset) output.append(part) -- 2.39.5