]> git.phdru.name Git - m_librarian.git/blob - m_librarian/inp.py
Process author names
[m_librarian.git] / m_librarian / inp.py
1
2 __all__ = ['import_inpx']
3
4 import os
5 from zipfile import ZipFile
6 from sqlobject import sqlhub, SQLObjectNotFound
7 from .db import Author, Book, Extension, Genre, Language, \
8     insert_name, insert_author
9
10
EOT = '\x04'  # INP field separator (ASCII End-of-Transmission, chr(4))


def split_line(line):
    """Split one INP record into a list of exactly twelve fields.

    The line is stripped of surrounding whitespace and split on ``EOT``.

    * Fewer than 11 fields: the record is rejected.
    * Exactly 11 fields (standard structure): ``None`` is appended in
      place of the missing language field.
    * More than 11 fields (new structure): only the first 12 are kept.

    Raises:
        ValueError: if the line has fewer than 11 fields.
    """
    fields = line.strip().split(EOT)
    count = len(fields)
    if count < 11:
        raise ValueError('Unknown INP structure: "%s"' % line)
    if count > 11:
        # New structure: anything past the twelfth field is ignored.
        return fields[:12]
    # Standard structure carries no language column; emulate it.
    fields.append(None)
    return fields
24
25
def _split_author(author):
    """Return ``[surname, name, misc_name]`` for one comma-separated author.

    Components that are absent are returned as empty strings.
    """
    pieces = author.split(',', 2)
    # split(',', 2) yields one to three items; pad up to three.
    pieces.extend([''] * (3 - len(pieces)))
    return pieces


def import_inp_line(archive, parts):
    """Store one parsed INP record as a ``Book`` with authors and genres.

    ``parts`` must hold twelve items in this order: authors, genres,
    title, series, series number, file, size, library id, deleted flag,
    extension, date, language.

    Nothing is done when ``Book.archive_file_idx`` already has an entry
    for ``(archive, file)``.  A series number that is not an integer is
    stored as ``None``; the deleted flag is true only for the string
    ``'1'``.  Authors and genres are ``:``-separated lists; empty
    entries are skipped.
    """
    (authors, genres, title, series, ser_no, file_name, size, lib_id,
     deleted, extension, date, language) = parts

    try:
        Book.archive_file_idx.get(archive, file_name)
        return  # This file of this archive has already been imported.
    except SQLObjectNotFound:
        pass

    try:
        ser_no = int(ser_no)
    except ValueError:
        ser_no = None
    size = int(size)
    deleted = (deleted == '1')

    extension_row = insert_name(Extension, extension)
    language_row = insert_name(Language, language)
    book = Book(title=title, series=series, ser_no=ser_no,
                archive=archive, file=file_name, size=size,
                lib_id=lib_id, deleted=deleted,
                extension=extension_row, date=date,
                language=language_row)

    for author in filter(None, authors.split(':')):
        surname, name, misc_name = _split_author(author)
        book.addAuthor(insert_author(surname, name, misc_name))

    for genre in filter(None, genres.split(':')):
        book.addGenre(insert_name(Genre, genre, title=genre))
66
67
def import_inp(archive, inp):
    """Import every record of an INP file.

    ``inp`` is iterated line by line; each line is split with
    ``split_line`` and handed to ``import_inp_line`` together with
    ``archive``.
    """
    for record in inp:
        fields = split_line(record)
        import_inp_line(archive, fields)
71
72
def import_inpx(path):
    """Import all ``.inp`` members of the INPX (zip) file at ``path``.

    Each member whose extension is ``.inp`` is imported inside its own
    transaction via ``sqlhub.doInTransaction``; the archive name passed
    on is the member name with ``.inp`` replaced by ``.zip``.  Members
    with any other extension are ignored.

    After the import, ``VACUUM`` is run on every table when the
    connection's ``dbName`` is ``'postgres'`` or ``'sqlite'``.
    """
    # Context managers guarantee that the zip file and each member
    # stream are closed even if an import raises.
    with ZipFile(path) as inpx:
        for name in inpx.namelist():
            archive, ext = os.path.splitext(name)
            if ext != '.inp':
                continue
            # NOTE(review): ZipFile.open() returns a binary stream; on
            # Python 3 its lines are bytes -- confirm split_line's input.
            with inpx.open(name) as inp:
                sqlhub.doInTransaction(import_inp, archive + '.zip', inp)
    connection = sqlhub.processConnection
    if connection.dbName in ('postgres', 'sqlite'):
        for table in Author, Book, Extension, Genre, Language:
            connection.query("VACUUM %s" % table.sqlmeta.table)
83     if connection.dbName in ('postgres', 'sqlite'):
84         for table in Author, Book, Extension, Genre, Language:
85             connection.query("VACUUM %s" % table.sqlmeta.table)