X-Git-Url: https://git.phdru.name/?a=blobdiff_plain;f=m_librarian%2Fglst.py;h=fedb27b2ed6647fe38b2d8569f7a0483fcad355e;hb=10f50ecc606a84ead65526f78a9544996f8e6ccd;hp=6ff58de3d93fef990806ce1e4638d8ec5299ed21;hpb=75821715e295abf0f67faaf80be3f03ac939d47c;p=m_librarian.git diff --git a/m_librarian/glst.py b/m_librarian/glst.py index 6ff58de..fedb27b 100755 --- a/m_librarian/glst.py +++ b/m_librarian/glst.py @@ -1,14 +1,17 @@ #! /usr/bin/env python +from __future__ import print_function import codecs +from glob import glob import os from sqlobject import sqlhub, SQLObjectNotFound from .db import Genre +__all__ = ['import_glst'] + def parse_glst_file(glst_filename): glst_file = codecs.open(glst_filename, 'r', 'utf-8') - genre_list = [] try: for line in glst_file: line = line.strip() @@ -21,10 +24,9 @@ def parse_glst_file(glst_filename): name, title = parts[1].split(';', 1) except (IndexError, ValueError): continue - genre_list.append((name, title)) + yield name, title finally: glst_file.close() - return genre_list def import_glst_file(glst_filename): @@ -40,23 +42,37 @@ def import_glst_file(glst_filename): return old, new -def _import_data(): +def _import_glst(): ml_dir = os.path.dirname(__file__) - old_fb2, new_fb2 = import_glst_file( - os.path.join(ml_dir, 'data', 'genres_fb2.glst')) - old_nonfb2, new_nonfb2 = import_glst_file( - os.path.join(ml_dir, 'data', 'genres_nonfb2.glst')) - sqlhub.processConnection.query("VACUUM %s" % Genre.sqlmeta.table) - return old_fb2 + old_nonfb2, new_fb2 + new_nonfb2 + count_old = count_new = 0 + for glst_file in glob(os.path.join(ml_dir, 'glst', '*.glst')): + _count_old, _count_new = import_glst_file(glst_file) + count_old += _count_old + count_new += _count_new + connection = sqlhub.processConnection + if connection.dbName == 'postgres': + connection.query("VACUUM %s" % Genre.sqlmeta.table) + return count_old, count_new -def import_data(): - return sqlhub.doInTransaction(_import_data) +def import_glst(): + count_old, count_new = sqlhub.doInTransaction(_import_glst) + connection = sqlhub.processConnection + if connection.dbName == 'sqlite': + connection.query("VACUUM") + return count_old, count_new def test(): ml_dir = os.path.dirname(__file__) - print parse_glst_file(os.path.join(ml_dir, 'data', 'genres_fb2.glst')) + for i, (name, title) in enumerate(parse_glst_file( + os.path.join(ml_dir, 'glst', 'genres_fb2_flibusta.glst') + )): + if i < 5: + print(name, title) + else: + break + if __name__ == '__main__': test()