3 Robot interface - check URLs from bookmarks database
5 Written by Broytman. Copyright (C) 2000-2010 PhiloSoft Design.
# Command-line handling (Python 2 syntax: `print` is a statement here).
# The getopt spec "ise" accepts three value-less switches: -i, -s and -e.
13 from getopt import getopt
14 optlist, args = getopt(sys.argv[1:], "ise")
# Walk the parsed (option, value) pairs.
# NOTE(review): the per-switch handling is not visible in this excerpt.
20 for _opt, _arg in optlist:
# Banner printed to stdout; the condition guarding it is not visible here.
33 print "Broytman check_urls, Copyright (C) 1997-2010 PhiloSoft Design"
# Diagnostics go to stderr: an error message followed by the usage line.
# NOTE(review): presumably emitted when `args` is non-empty - confirm.
36 sys.stderr.write("check_urls: too many arguments\n")
37 sys.stderr.write("Usage: check_urls [-ise]\n")
# Default for the progress-bar flag: true only when stderr is a terminal.
41 show_pbar = sys.stderr.isatty()
# Progress-bar class from m_lib; instantiated later once the object count
# is known.
# NOTE(review): presumably imported only when show_pbar is true - confirm.
45 from m_lib.pbar.tty_pbar import ttyProgressBar
# Logging setup. Two alternative start-up paths write to "check.log";
# the condition that selects between them is not visible in this excerpt.
49 from m_lib.flog import makelog, openlog
# Path 1: the run was restarted to recheck errors.
# NOTE(review): presumably openlog() appends to an existing log - confirm
# against m_lib.flog.
51 log = openlog("check.log")
52 log("chk_urls restarted for errors")
54 print "chk_urls restarted for errors"
# Path 2: normal start.
# NOTE(review): presumably makelog() starts a fresh log - confirm against
# m_lib.flog.
56 log = makelog("check.log")
57 log("check_urls started")
59 print " check_urls: normal start"
# Project-local singletons: `storage` loads/stores the bookmarks database,
# `robot` performs the actual URL check (see robot.check_url below).
61 from storage import storage
64 from robots import robot
# Announce which storage file is being loaded (no trailing newline).
68 sys.stdout.write("Loading %s: " % storage.filename)
# Load the bookmark tree, then flatten it: make_linear() is expected to
# populate root_folder.linear, which is read on the next line.
71 root_folder = storage.load()
72 from bkmk_objects import make_linear, break_tree
73 make_linear(root_folder)
# Total number of objects in the flattened list.
74 objects = len(root_folder.linear)
# Label used for the recheck-errors mode; how `s` is used afterwards is
# not visible in this excerpt.
81 s = "Rechecking errors: "
# Progress bar spanning 0..objects.
# NOTE(review): presumably created only when show_pbar is true - confirm.
88 pbar = ttyProgressBar(0, objects)
# Main loop: visit every object of the flattened bookmark list by index.
# NOTE(review): the `try:`/`if`/`else:` headers and all indentation are
# missing from this excerpt, so branch structure below is inferred.
97 for object_no in range(objects):
# Progress is shown 1-based.
99 pbar.display(object_no+1)
# NOTE(review): the name `object` shadows the Python builtin.
101 object = root_folder.linear[object_no]
# Counts every visited object, bookmark or not.
102 object_count = object_count + 1
# Only bookmarks carry an href to check.
104 if object.isBookmark:
105 if object.href.startswith('place:'): # Firefox SmartBookmarks
# "place:" hrefs are only logged as skipped.
# NOTE(review): presumably followed by `continue` - not visible here.
106 log("Skipped %s" % object.href)
# Drop any error attribute already on the object so that it does not
# survive this run's result.
110 if hasattr(object, "error"):
111 delattr(object, "error")
# `checked` maps an href to the index (in root_folder.linear) of the
# object on which that href was recorded as checked (see the assignment
# below). A duplicate href is not checked again; the result attributes
# are copied from that earlier object instead.
# (dict.has_key is Python 2 only.)
115 if checked.has_key(object.href):
116 log("Already checked %s" % object.href)
117 old_object = root_folder.linear[checked[object.href]]
# Copy only the attributes the earlier object actually has.
118 for attr_name in ("last_visit", "last_modified",
119 "error", "no_error", "moved", "size", "md5", "real_title",
120 "last_tested", "test_time", "icon", "charset"):
121 if hasattr(old_object, attr_name):
122 setattr(object, attr_name, getattr(old_object, attr_name))
# First occurrence of this href: run the robot on it.
# NOTE(review): presumably the `else:` branch of the has_key test; how
# `rcode` is examined is not visible in this excerpt.
124 log("Checking %s" % object.href)
125 rcode = robot.check_url(object)
# Remember where this href was checked and count it.
128 checked[object.href] = object_no
129 urls_no = urls_no + 1
# Accumulate the total size; objects whose `size` is missing or not
# convertible to int are ignored.
131 size = size + int(object.size)
132 except (AttributeError, TypeError, ValueError):
133 pass # Some object does not have a size :(
# Logged when the user interrupts the run.
# NOTE(review): presumably inside an `except KeyboardInterrupt:` handler.
135 log("Interrupted by user (^C)")
# Final summary on stdout: objects visited, URLs actually checked, and the
# accumulated size of the checked objects.
144 print object_count, "objects passed"
145 print urls_no, "URLs checked"
146 print size, "bytes eaten"
# Undo the flattening done by make_linear() and write the updated tree
# back to storage.
# NOTE(review): break_tree's exact effect is defined in bkmk_objects - confirm.
148 break_tree(root_folder.linear)
149 storage.store(root_folder)
152 log("check_urls finished ok")
# Script entry-point guard; the call it protects is not visible here.
156 if __name__ == '__main__':