X-Git-Url: https://git.phdru.name/?a=blobdiff_plain;f=Robots%2Fparse_html.py;h=678f3e2dae49d9961c07e040aeca2ec7e8e832aa;hb=2f06deff348d6a49ba7f8f0d941e0bd3445e6418;hp=80d4a9243bbbec31b96d98a4881182afefd05361;hpb=38f3645cce7a5875128d788df6631069c761b987;p=bookmarks_db.git diff --git a/Robots/parse_html.py b/Robots/parse_html.py index 80d4a92..678f3e2 100755 --- a/Robots/parse_html.py +++ b/Robots/parse_html.py @@ -119,10 +119,18 @@ def parse_html(filename, charset=None, log=None): if __name__ == '__main__': import sys - from m_lib.defenc import default_encoding - current_charset = default_encoding.replace("windows-", "cp") - parser = parse_html(sys.argv[1], universal_charset, + l = len(sys.argv) + if l == 3: + filename = sys.argv[1] + charset = sys.argv[2] + elif l == 2: + filename = sys.argv[1] + charset = universal_charset + else: + sys.exit("Usage: %s filename [charset]" % sys.argv[0]) + + parser = parse_html(filename, universal_charset, log=lambda s: sys.stdout.write(s + '\n')) print " refresh:", parser.refresh print " icon :", parser.icon