Feat(dotfiles2html.py): Process `mc.ext.ini`

[phdru.name/phdru.name.git] / reindex_blog.py
diff --git a/reindex_blog.py b/reindex_blog.py

index c2e16ce32c35029bb31d05f382f46e4d65e55617..0f1a8f5f9b185fe34ccecbdf8f2b297f3bd0b3d0 100755 (executable)
--- a/reindex_blog.py
+++ b/reindex_blog.py
@@ -2,7 +2,7 @@
  # -*- coding: koi8-r -*-
  
  __author__ = "Oleg Broytman <phd@phdru.name>"
-__copyright__ = "Copyright (C) 2006-2017 PhiloSoft Design"
+__copyright__ = "Copyright (C) 2006-2021 PhiloSoft Design"
  
  import sys, os
  from Cheetah.Template import Template
@@ -482,6 +482,8 @@ class AbsURLHTMLParser(_HTMLParser):
        self.accumulator += '<a'
        for attrname, value in attrs:
           value = cgi.escape(value, True)
+         if isinstance(value, unicode):
+            value = value.encode('koi8-r')
           if attrname == 'href':
              self.accumulator += ' href="%s"' % urljoin(self.base, value)
           else:
@@ -525,9 +527,11 @@ from rss_20 import rss_20
  from news import NewsItem
  
  if blog_root:
-   baseURL = "http://phdru.name/%s/" % blog_root
+   blog_root_url = blog_root[
+        blog_root.find('/htdocs/phdru.name/') + len('/htdocs/phdru.name/'):]
+   baseURL = "https://phdru.name/%s/" % blog_root_url
  else:
-   baseURL = "http://phdru.name/"
+   baseURL = "https://phdru.name/"
  
  items = []
  for item in tuple(reversed(all_titles_tags))[:10]:
@@ -544,8 +548,17 @@ for item in tuple(reversed(all_titles_tags))[:10]:
     item.categoryList = tags
     body = bodies[(year, month, day, file)]
     body = absolute_urls(body, baseURL + url_path)
+   try:
+       body.decode('utf-8')
+   except UnicodeDecodeError:
+       body = body.decode('koi8-r').encode('utf-8')
     item.body = body
-   item.excerpt = get_first_p(body)
+   excerpt = get_first_p(body)
+   try:
+       excerpt.decode('utf-8')
+   except UnicodeDecodeError:
+       excerpt = excerpt.decode('koi8-r').encode('utf-8')
+   item.excerpt = excerpt
  
  namespace = {
     "title": "Oleg Broytman's blog",