X-Git-Url: https://git.phdru.name/?a=blobdiff_plain;f=check_urls.py;h=d6d038d2c624a116c22b60f772260095661909a1;hb=ffdaa8835ae34cd5b9c712d962a5830e0edeed05;hp=f75cb16cc20f47ae769ee6775763e27a1293e9a9;hpb=7fd1132c4ab530b7b34e846ca45f99b8737dd127;p=bookmarks_db.git diff --git a/check_urls.py b/check_urls.py index f75cb16..d6d038d 100755 --- a/check_urls.py +++ b/check_urls.py @@ -1,14 +1,18 @@ #! /usr/bin/env python -""" - Robot interface - check URLs from bookmarks database +"""Robot interface - check URLs from bookmarks database - Written by Broytman. Copyright (C) 2000-2010 PhiloSoft Design. +This file is a part of Bookmarks database and Internet robot. """ - +from __future__ import print_function import sys, os +__author__ = "Oleg Broytman " +__copyright__ = "Copyright (C) 2000-2017 PhiloSoft Design" +__license__ = "GNU GPL" + + def run(): from getopt import getopt optlist, args = getopt(sys.argv[1:], "ise") @@ -30,7 +34,7 @@ def run(): pass if report_stats: - print "Broytman check_urls, Copyright (C) 1997-2010 PhiloSoft Design" + print("Broytman check_urls, Copyright (C) 1997-2017 PhiloSoft Design") if args: sys.stderr.write("check_urls: too many arguments\n") @@ -51,12 +55,12 @@ def run(): log = openlog("check.log") log("chk_urls restarted for errors") if report_stats: - print "chk_urls restarted for errors" + print("chk_urls restarted for errors") else: log = makelog("check.log") log("check_urls started") if report_stats: - print " check_urls: normal start" + print(" check_urls: normal start") from storage import storage storage = storage() @@ -74,7 +78,7 @@ def run(): objects = len(root_folder.linear) if report_stats: - print "Ok" + print("Ok") if report_stats: if only_errors: @@ -102,8 +106,10 @@ def run(): object_count = object_count + 1 if object.isBookmark: - if object.href.startswith('place:'): # Firefox SmartBookmarks - log("Skipped %s" % object.href) + href = object.href + if (href.startswith('place:') # Firefox SmartBookmarks + or '%s' in href): # Bookmark with keyword + log("Skipped %s" % href) continue if only_errors: @@ -112,20 +118,20 @@ def run(): else: continue - if checked.has_key(object.href): - log("Already checked %s" % object.href) - old_object = root_folder.linear[checked[object.href]] + if checked.has_key(href): + log("Already checked %s" % href) + old_object = root_folder.linear[checked[href]] for attr_name in ("last_visit", "last_modified", "error", "no_error", "moved", "size", "md5", "real_title", "last_tested", "test_time", "icon", "charset"): if hasattr(old_object, attr_name): setattr(object, attr_name, getattr(old_object, attr_name)) else: - log("Checking %s" % object.href) + log("Checking %s" % href) rcode = robot.check_url(object) if rcode: - checked[object.href] = object_no + checked[href] = object_no urls_no = urls_no + 1 try: size = size + int(object.size) @@ -140,10 +146,10 @@ def run(): del pbar if report_stats: - print "Ok" - print object_count, "objects passed" - print urls_no, "URLs checked" - print size, "bytes eaten" + print("Ok") + print(object_count, "objects passed") + print(urls_no, "URLs checked") + print(size, "bytes eaten") break_tree(root_folder.linear) storage.store(root_folder)