import codecs
-
-universal_charset = "utf-8"
-DEFAULT_CHARSET = "cp1251" # Stupid default for Russian Cyrillic
-
-parsers = []
+import os
try:
from . import bkmk_ph_beautifulsoup4
import re
from htmlentitydefs import name2codepoint
+universal_charset = "utf-8"
+DEFAULT_CHARSET = "cp1251" # Stupid default for Russian Cyrillic
+
+parsers = []
+
# Raw string literals keep regex escapes such as \w out of Python's own
# string-escape processing; a plain "\w" literal is an invalid escape
# sequence that newer interpreters warn about. The pattern text is unchanged.
# Matches a named character reference such as "&amp;" (captured whole).
entity_re = re.compile(r"(&\w+;)")
# Matches a decimal numeric character reference such as "&#1234;".
num_entity_re = re.compile(r"(&#[0-9]+;)")
return ''.join(output)
-import os
# Raw value of the BKMK_DEBUG_HTML_PARSERS environment variable, or None when
# it is unset. Presumably used as a switch for parser debugging output --
# NOTE(review): confirm against the places that read this name.
BKMK_DEBUG_HTML_PARSERS = os.environ.get("BKMK_DEBUG_HTML_PARSERS")