X-Git-Url: https://git.mdrn.pl/wolnelektury.git/blobdiff_plain/d4d849867aedf29df6cd3d764fa5bd9c0f6e8c76..3ba4d1e44766528f0f5b99a825243dd976a7f03c:/src/catalogue/management/commands/eisbn_csv.py diff --git a/src/catalogue/management/commands/eisbn_csv.py b/src/catalogue/management/commands/eisbn_csv.py index ec1333203..4e8f5e4aa 100644 --- a/src/catalogue/management/commands/eisbn_csv.py +++ b/src/catalogue/management/commands/eisbn_csv.py @@ -11,7 +11,7 @@ from catalogue.models import Book from librarian import RDFNS, DCNS -FORMATS = ('HTML', 'PDF', 'TXT', 'EPUB', 'MOBI') +FORMATS = ('PDF', 'HTML', 'TXT', 'EPUB', 'MOBI') FORMATS_WITH_CHILDREN = ('PDF', 'EPUB', 'MOBI') @@ -37,25 +37,43 @@ def is_institution(name): return name.startswith(u'Zgromadzenie Ogólne') +VOLUME_SEPARATORS = (u'. część ', u', część ', u', tom ', u'. der tragödie ') + + +def get_volume(title): + for volume_separator in VOLUME_SEPARATORS: + if volume_separator in title.lower(): + vol_idx = title.lower().index(volume_separator) + stripped = title[:vol_idx] + vol_name = title[vol_idx + 2:] + return stripped, vol_name + return title, '' + + class Command(BaseCommand): @staticmethod def dc_values(desc, tag): return [e.text for e in desc.findall('.//' + DCNS(tag))] def handle(self, *args, **options): + slugs = [line.strip() for line in sys.stdin] writer = csv.writer(sys.stdout) - for book in Book.objects.all(): - desc = book.wldocument().edoc.find('.//' + RDFNS('Description')) - formats = FORMATS_WITH_CHILDREN if book.children.exists() else FORMATS - for file_format in formats: - imprint = u'Fundacja Nowoczesna Polska' - title = book.title + all_books = Book.objects.filter(slug__in=slugs) + books_without_children = all_books.filter(children=None) + for file_format in FORMATS: + if file_format in FORMATS_WITH_CHILDREN: + books = all_books + else: + books = books_without_children + for book in books: + desc = book.wldocument().edoc.find('.//' + RDFNS('Description')) + imprint = '; '.join(self.dc_values(desc, 'publisher')) + title, volume = get_volume(book.title) subtitle = '' year = '' - volume = '' publication_date = localtime(book.created_at).date().isoformat() info_date = publication_date - author = '; '.join(self.dc_values(desc, 'creator')) + author = '; '.join(author.strip() for author in self.dc_values(desc, 'creator')) author_person = author if not is_institution(author) else '' author_institution = author if is_institution(author) else '' publication_type = 'DGO' @@ -78,5 +96,7 @@ class Command(BaseCommand): product_form1, product_form2, language, + book.slug, + file_format, ] writer.writerow([s.encode('utf-8') for s in row])