X-Git-Url: https://git.phdru.name/?p=bookmarks_db.git;a=blobdiff_plain;f=check_urls.py;h=e2dac0ff3c516a65ed9f23b22d37ce050bbe6030;hp=057e023e7eb675026b85ec7f364bc988431e2ca4;hb=96e39d55c791326368ff14d538850e14ba5a2c97;hpb=f15f53958b9f6192bd4c3ae9cf1bf0a039e7f3f7 diff --git a/check_urls.py b/check_urls.py index 057e023..e2dac0f 100755 --- a/check_urls.py +++ b/check_urls.py @@ -1,13 +1,14 @@ #! /usr/bin/env python -""" - Robot interface - check URLs from bookmarks database +"""Robot interface - check URLs from bookmarks database - Written by BroytMann. Copyright (C) 2000-2007 PhiloSoft Design. +This file is a part of Bookmarks database and Internet robot. """ +__author__ = "Oleg Broytman " +__copyright__ = "Copyright (C) 2000-2012 PhiloSoft Design" +__license__ = "GNU GPL" -import sys, os, tempfile -tempfname = "check_urls" + tempfile.gettempprefix() + "tmp" +import sys, os def run(): @@ -31,7 +32,7 @@ def run(): pass if report_stats: - print "BroytMann check_urls, Copyright (C) 1997-2007 PhiloSoft Design" + print "Broytman check_urls, Copyright (C) 1997-2010 PhiloSoft Design" if args: sys.stderr.write("check_urls: too many arguments\n") @@ -63,7 +64,7 @@ def run(): storage = storage() from robots import robot - robot = robot(tempfname, log) + robot = robot(log) if report_stats: sys.stdout.write("Loading %s: " % storage.filename) @@ -103,26 +104,32 @@ def run(): object_count = object_count + 1 if object.isBookmark: + href = object.href + if (href.startswith('place:') # Firefox SmartBookmarks + or '%s' in href): # Bookmark with keyword + log("Skipped %s" % href) + continue + if only_errors: if hasattr(object, "error"): delattr(object, "error") else: continue - if checked.has_key(object.href): - log("Already checked %s" % object.href) - old_object = root_folder.linear[checked[object.href]] + if checked.has_key(href): + log("Already checked %s" % href) + old_object = root_folder.linear[checked[href]] for attr_name in ("last_visit", "last_modified", "error", "no_error", "moved", "size", "md5", "real_title", "last_tested", "test_time", "icon", "charset"): if hasattr(old_object, attr_name): setattr(object, attr_name, getattr(old_object, attr_name)) else: - log("Checking %s" % object.href) + log("Checking %s" % href) rcode = robot.check_url(object) if rcode: - checked[object.href] = object_no + checked[href] = object_no urls_no = urls_no + 1 try: size = size + int(object.size) @@ -149,11 +156,6 @@ def run(): log("check_urls finished ok") log.close() - try: - os.unlink(tempfname) - except os.error: - pass - if __name__ == '__main__': run()