]> git.phdru.name Git - m_librarian.git/blobdiff - m_librarian/glst.py
Tests(glst): Fix file name in inline test; print first 5 genres
[m_librarian.git] / m_librarian / glst.py
index cd2b8c90f33a7235c86d7dc9e12887253f07e95f..fedb27b2ed6647fe38b2d8569f7a0483fcad355e 100755 (executable)
@@ -1,14 +1,17 @@
 #! /usr/bin/env python
 
+from __future__ import print_function
 import codecs
+from glob import glob
 import os
 from sqlobject import sqlhub, SQLObjectNotFound
 from .db import Genre
 
+__all__ = ['import_glst']
+
 
 def parse_glst_file(glst_filename):
     glst_file = codecs.open(glst_filename, 'r', 'utf-8')
-    genre_list = []
     try:
         for line in glst_file:
             line = line.strip()
@@ -21,10 +24,9 @@ def parse_glst_file(glst_filename):
                 name, title = parts[1].split(';', 1)
             except (IndexError, ValueError):
                 continue
-            genre_list.append((name, title))
+            yield name, title
     finally:
         glst_file.close()
-    return genre_list
 
 
 def import_glst_file(glst_filename):
@@ -40,20 +42,37 @@ def import_glst_file(glst_filename):
     return old, new
 
 
-def _import_data():
+def _import_glst():
     ml_dir = os.path.dirname(__file__)
-    old_fb2, new_fb2 = import_glst_file(
-        os.path.join(ml_dir, 'data', 'genres_fb2.glst'))
-    old_nonfb2, new_nonfb2 = import_glst_file(
-        os.path.join(ml_dir, 'data', 'genres_nonfb2.glst'))
-    sqlhub.processConnection.query("VACUUM %s" % Genre.sqlmeta.table)
-    return old_fb2 + old_nonfb2, new_fb2 + new_nonfb2
+    count_old = count_new = 0
+    for glst_file in glob(os.path.join(ml_dir, 'glst', '*.glst')):
+        _count_old, _count_new = import_glst_file(glst_file)
+        count_old += _count_old
+        count_new += _count_new
+    connection = sqlhub.processConnection
+    if connection.dbName == 'postgres':
+        connection.query("VACUUM %s" % Genre.sqlmeta.table)
+    return count_old, count_new
 
 
-def import_data():
-    return sqlhub.doInTransaction(_import_data)
+def import_glst():
+    count_old, count_new = sqlhub.doInTransaction(_import_glst)
+    connection = sqlhub.processConnection
+    if connection.dbName == 'sqlite':
+        connection.query("VACUUM")
+    return count_old, count_new
 
 
-if __name__ == '__main__':
+def test():
     ml_dir = os.path.dirname(__file__)
-    print parse_glst_file(os.path.join(ml_dir, 'data', 'genres_fb2.glst'))
+    for i, (name, title) in enumerate(parse_glst_file(
+        os.path.join(ml_dir, 'glst', 'genres_fb2_flibusta.glst')
+    )):
+        if i < 5:
+            print(name, title)
+        else:
+            break
+
+
+if __name__ == '__main__':
+    test()