X-Git-Url: https://git.phdru.name/?a=blobdiff_plain;ds=sidebyside;f=Robots%2Fparse_html.py;h=137ebfad9809d369712483bfa63b97744f7c6f1a;hb=284b0935fc4237bda2e51229860c771f78887be2;hp=0d7b20b5ce82b88d596b1cb25aac90084a997735;hpb=3a4e6b782c229014a6cc49f1e68681696c1ed1f3;p=bookmarks_db.git diff --git a/Robots/parse_html.py b/Robots/parse_html.py index 0d7b20b..137ebfa 100755 --- a/Robots/parse_html.py +++ b/Robots/parse_html.py @@ -33,7 +33,8 @@ def recode_entities(title, charset): output = [] for part in entity_re.split(title): if entity_re.match(part): - part = entitydefs.get(part[1:-1], part) + if part not in ("&amp;", "&lt;", "&gt;", "&quote;", "&nbsp;"): + part = entitydefs.get(part[1:-1], part) output.append(part) output2 = []