X-Git-Url: https://git.phdru.name/?a=blobdiff_plain;f=Robots%2Fparse_html.py;h=cbb45d612f9b33699b6f2d0bbe397b11a3562fe1;hb=f79d81fcd336e913bf0f42f0a6fbdb582de0f3e3;hp=a83585df318afb1602a916a1a17768485a099138;hpb=4fd6d1f55e5e5dbcc0bdc1b933d6e14076316437;p=bookmarks_db.git diff --git a/Robots/parse_html.py b/Robots/parse_html.py index a83585d..cbb45d6 100755 --- a/Robots/parse_html.py +++ b/Robots/parse_html.py @@ -2,7 +2,7 @@ """ HTML Parsers wrapper - Written by Broytman. Copyright (C) 1997-2010 PhiloSoft Design + Written by Broytman. Copyright (C) 1997-2011 PhiloSoft Design """ import codecs @@ -41,6 +41,13 @@ except ImportError: else: parsers.append(parse_html_html5.parse_html) +# ElementTidy often segfaults +#try: +# import parse_html_etreetidy +#except ImportError: +# pass +#else: +# parsers.append(parse_html_etreetidy.parse_html) import re from htmlentitydefs import name2codepoint