Fix(Robots/bkmk_robot_base): Ignore unknown charset

[bookmarks_db.git] / Robots / bkmk_robot_base.py
diff --git a/Robots/bkmk_robot_base.py b/Robots/bkmk_robot_base.py

index 2024ab85efd74594eb4700078f19f7e012ae2b78..1e511d0b48a625e752f337431892ff7872c050bf 100644 (file)
--- a/Robots/bkmk_robot_base.py
+++ b/Robots/bkmk_robot_base.py
@@ -5,7 +5,7 @@ This file is a part of Bookmarks database and Internet robot.
  """
  
  __author__ = "Oleg Broytman <phd@phdru.name>"
-__copyright__ = "Copyright (C) 2000-2023 PhiloSoft Design"
+__copyright__ = "Copyright (C) 2000-2024 PhiloSoft Design"
  __license__ = "GNU GPL"
  
  __all__ = ['robot_base', 'get_error']
@@ -135,8 +135,13 @@ class robot_base(Robot):
                              break
                      content_stripped = content.strip()
                      if content_stripped and charset:
-                        content_stripped = content_stripped.decode(
-                            charset, 'replace')
+                        try:
+                            content_stripped = content_stripped.decode(
+                                charset, 'replace')
+                        except LookupError:
+                            charset = None
+                            self.log("   unknown charset "
+                                     "in Content-Type header")
                      if content_stripped and is_html:
                          parser = parse_html(
                              content_stripped, charset, self.log)
@@ -211,7 +216,7 @@ class robot_base(Robot):
                                                         bookmark.icon
                                                         )
                                  else:
-                                    self.log("   no icon        :"
+                                    self.log("   no icon        : "
                                               "bad content type '%s'"
                                               % content_type
                                               )