import codecs
import os
+import re
+from htmlentitydefs import name2codepoint
+
+from compat import unicode, unichr
+
+DEFAULT_CHARSET = "cp1251" # Default charset: cp1251 (Windows-1251), chosen for Russian Cyrillic text
+parsers = [] # Parser registry; presumably filled with parse_html callables by the import attempts below - TODO confirm
try:
from . import bkmk_ph_beautifulsoup4
# else:
# parsers.append(bkmk_ph_etreetidy.parse_html)
-import re
-from htmlentitydefs import name2codepoint
-
universal_charset = "utf-8"
-DEFAULT_CHARSET = "cp1251" # Stupid default for Russian Cyrillic
-
-parsers = []
-
-entity_re = re.compile("(&\w+;)")
+entity_re = re.compile("(&\\w+;)") # Captures "&name;"-style references, e.g. "&amp;"; the backslash is doubled so the regex engine receives \w
num_entity_re = re.compile("(&#[0-9]+;)")