X-Git-Url: https://git.phdru.name/?a=blobdiff_plain;f=parse_html%2Fbkmk_ph_htmlparser.py;h=0798467386bda9ab993df160f1d4937b1e1802d9;hb=7a40a1b3d6d3824beed843c53ddf13994936674a;hp=d7020b03e933a9d822c541fe9c3936a5e0310ee1;hpb=1249f2d538e9d679421d7bbb59dfac33fad537f4;p=bookmarks_db.git diff --git a/parse_html/bkmk_ph_htmlparser.py b/parse_html/bkmk_ph_htmlparser.py index d7020b0..0798467 100644 --- a/parse_html/bkmk_ph_htmlparser.py +++ b/parse_html/bkmk_ph_htmlparser.py @@ -1,10 +1,11 @@ """HTML Parser using Pythons' HTMLParser This file is a part of Bookmarks database and Internet robot. + """ __author__ = "Oleg Broytman " -__copyright__ = "Copyright (C) 1997-2013 PhiloSoft Design" +__copyright__ = "Copyright (C) 1997-2014 PhiloSoft Design" __license__ = "GNU GPL" __all__ = ['parse_html'] @@ -79,17 +80,13 @@ class HTMLParser(_HTMLParser): self.icon = href -def parse_html(filename, charset=None, log=None): - infile = open(filename, 'r') +def parse_html(html_text, charset=None, log=None): parser = HTMLParser(charset) - for line in infile: - try: - parser.feed(line) - except (HTMLParseError, HTMLHeadDone): - break - - infile.close() + try: + parser.feed(html_text) + except (HTMLParseError, HTMLHeadDone): + pass try: parser.close()