X-Git-Url: https://git.phdru.name/?a=blobdiff_plain;f=m_librarian%2Fglst.py;h=206dcc40f858a306524ef07e1d2ec68b02269cc7;hb=7b3352daa8d57878f0d727f1a4f4b1f2fc9609da;hp=44ec6121cbeaf6038730f3a5f9c17abf0a99a0d4;hpb=d0a1abea3d89062e8f9b71dd6df45db5d8b84997;p=m_librarian.git diff --git a/m_librarian/glst.py b/m_librarian/glst.py index 44ec612..206dcc4 100755 --- a/m_librarian/glst.py +++ b/m_librarian/glst.py @@ -1,16 +1,18 @@ #! /usr/bin/env python -__all__ = ['import_glst'] - +from __future__ import print_function +from glob import glob import codecs import os + from sqlobject import sqlhub, SQLObjectNotFound from .db import Genre +__all__ = ['import_glst'] + def parse_glst_file(glst_filename): glst_file = codecs.open(glst_filename, 'r', 'utf-8') - genre_list = [] try: for line in glst_file: line = line.strip() @@ -23,10 +25,9 @@ def parse_glst_file(glst_filename): name, title = parts[1].split(';', 1) except (IndexError, ValueError): continue - genre_list.append((name, title)) + yield name, title finally: glst_file.close() - return genre_list def import_glst_file(glst_filename): @@ -44,21 +45,35 @@ def import_glst_file(glst_filename): def _import_glst(): ml_dir = os.path.dirname(__file__) - old_fb2, new_fb2 = import_glst_file( - os.path.join(ml_dir, 'glst', 'genres_fb2.glst')) - old_nonfb2, new_nonfb2 = import_glst_file( - os.path.join(ml_dir, 'glst', 'genres_nonfb2.glst')) - sqlhub.processConnection.query("VACUUM %s" % Genre.sqlmeta.table) - return old_fb2 + old_nonfb2, new_fb2 + new_nonfb2 + count_old = count_new = 0 + for glst_file in glob(os.path.join(ml_dir, 'glst', '*.glst')): + _count_old, _count_new = import_glst_file(glst_file) + count_old += _count_old + count_new += _count_new + connection = sqlhub.processConnection + if connection.dbName == 'postgres': + connection.query("VACUUM %s" % Genre.sqlmeta.table) + return count_old, count_new def import_glst(): - return sqlhub.doInTransaction(_import_glst) + count_old, count_new = sqlhub.doInTransaction(_import_glst) + connection = sqlhub.processConnection + if connection.dbName == 'sqlite': + connection.query("VACUUM") + return count_old, count_new def test(): ml_dir = os.path.dirname(__file__) - print parse_glst_file(os.path.join(ml_dir, 'glst', 'genres_fb2.glst')) + for i, (name, title) in enumerate(parse_glst_file( + os.path.join(ml_dir, 'glst', 'genres_fb2_flibusta.glst') + )): + if i < 5: + print(name, title) + else: + break + if __name__ == '__main__': test()