import codecs
import os
+import re
+from htmlentitydefs import name2codepoint
from ..compat import unicode
+DEFAULT_CHARSET = "cp1251" # Stupid default for Russian Cyrillic
+parsers = []
+
try:
from . import bkmk_ph_beautifulsoup4
except ImportError:
# else:
# parsers.append(bkmk_ph_etreetidy.parse_html)
-import re
-from htmlentitydefs import name2codepoint
-
# Charset name constant for UTF-8.
# NOTE(review): its consumers are outside this view -- presumably the
# encoding parsed text is normalised to; confirm against the callers.
universal_charset = "utf-8"
-DEFAULT_CHARSET = "cp1251" # Stupid default for Russian Cyrillic
-
-parsers = []
-
# Precompiled patterns for HTML character references.  The patterns are
# written as raw string literals so the regex escape ``\w`` is not run through
# Python's own string-escape processing (an unrecognised escape in a plain
# literal triggers a warning on newer interpreters).  The compiled patterns
# are unchanged.
# Named references such as "&amp;"; the whole reference is captured.
entity_re = re.compile(r"(&\w+;)")
# Decimal numeric references such as "&#1234;"; the whole reference is captured.
num_entity_re = re.compile(r"(&#[0-9]+;)")