#969: generate txt files during publication
[wolnelektury.git] / apps / catalogue / management / commands / importbooks.py
1 # -*- coding: utf-8 -*-
2 # This file is part of Wolnelektury, licensed under GNU Affero GPLv3 or later.
3 # Copyright © Fundacja Nowoczesna Polska. See NOTICE for more information.
4 #
5 import os
6 import sys
7 import time
8 from optparse import make_option
9
10 from django.core.management.base import BaseCommand
11 from django.core.management.color import color_style
12 from django.core.files import File
13
14 from catalogue.models import Book
15
16
17 class Command(BaseCommand):
18     option_list = BaseCommand.option_list + (
19         make_option('-q', '--quiet', action='store_false', dest='verbose', default=True,
20             help='Verbosity level; 0=minimal output, 1=normal output, 2=all output'),
21         make_option('-f', '--force', action='store_true', dest='force', default=False,
22             help='Print status messages to stdout'),
23         make_option('-E', '--no-build-epub', action='store_false', dest='build_epub', default=True,
24             help='Don\'t build EPUB file'),
25         make_option('-T', '--no-build-txt', action='store_false', dest='build_txt', default=True,
26             help='Don\'t build TXT file'),
27         make_option('-w', '--wait-until', dest='wait_until', metavar='TIME',
28             help='Wait until specified time (Y-M-D h:m:s)'),
29     )
30     help = 'Imports books from the specified directories.'
31     args = 'directory [directory ...]'
32
33     def handle(self, *directories, **options):
34         from django.db import transaction
35
36         self.style = color_style()
37
38         verbose = options.get('verbose')
39         force = options.get('force')
40         show_traceback = options.get('traceback', False)
41
42         if options.get('wait_until'):
43             wait_until = time.mktime(time.strptime(options.get('wait_until'), '%Y-%m-%d %H:%M:%S'))
44             if verbose > 0:
45                 print "Will wait until %s; it's %f seconds from now" % (
46                     time.strftime('%Y-%m-%d %H:%M:%S', 
47                     time.localtime(wait_until)), wait_until - time.time())
48
49         # Start transaction management.
50         transaction.commit_unless_managed()
51         transaction.enter_transaction_management()
52         transaction.managed(True)
53
54         files_imported = 0
55         files_skipped = 0
56
57         for dir_name in directories:
58             if not os.path.isdir(dir_name):
59                 print self.style.ERROR("%s: Not a directory. Skipping." % dir_name)
60             else:
61                 # files queue
62                 files = sorted(os.listdir(dir_name))
63                 postponed = {}
64                 while files:
65                     file_name = files.pop(0)
66                     file_path = os.path.join(dir_name, file_name)
67                     file_base, ext = os.path.splitext(file_path)
68
69                     # Skip files that are not XML files
70                     if not ext == '.xml':
71                         continue
72
73                     if verbose > 0:
74                         print "Parsing '%s'" % file_path
75                     else:
76                         sys.stdout.write('.')
77                         sys.stdout.flush()
78
79                     # Import book files
80                     try:
81                         book = Book.from_xml_file(file_path, overwrite=force, 
82                                                   build_epub=options.get('build_epub'),
83                                                   build_txt=options.get('build_txt'))
84                         files_imported += 1
85
86                         if os.path.isfile(file_base + '.pdf'):
87                             book.pdf_file.save('%s.pdf' % book.slug, File(file(file_base + '.pdf')))
88                             if verbose:
89                                 print "Importing %s.pdf" % file_base
90                         if os.path.isfile(file_base + '.epub'):
91                             book.epub_file.save('%s.epub' % book.slug, File(file(file_base + '.epub')))
92                             if verbose:
93                                 print "Importing %s.epub" % file_base
94                         if os.path.isfile(file_base + '.odt'):
95                             book.odt_file.save('%s.odt' % book.slug, File(file(file_base + '.odt')))
96                             if verbose:
97                                 print "Importing %s.odt" % file_base
98                         if os.path.isfile(file_base + '.txt'):
99                             book.txt_file.save('%s.txt' % book.slug, File(file(file_base + '.txt')))
100                             if verbose:
101                                 print "Importing %s.txt" % file_base
102                         if os.path.isfile(os.path.join(dir_name, book.slug + '.mp3')):
103                             book.mp3_file.save('%s.mp3' % book.slug, File(file(os.path.join(dir_name, book.slug + '.mp3'))))
104                             if verbose:
105                                 print "Importing %s.mp3" % book.slug
106                         if os.path.isfile(os.path.join(dir_name, book.slug + '.ogg')):
107                             book.ogg_file.save('%s.ogg' % book.slug, File(file(os.path.join(dir_name, book.slug + '.ogg'))))
108                             if verbose:
109                                 print "Importing %s.ogg" % book.slug
110                         if os.path.isfile(os.path.join(dir_name, book.slug + '.daisy.zip')):
111                             book.ogg_file.save('%s.daisy.zip' % book.slug, File(file(os.path.join(dir_name, book.slug + '.daisy.zip'))))
112                             if verbose:
113                                 print "Importing %s.daisy.zip" % book.slug
114
115                         book.save()
116
117                     except Book.AlreadyExists, msg:
118                         print self.style.ERROR('%s: Book already imported. Skipping. To overwrite use --force.' %
119                             file_path)
120                         files_skipped += 1
121
122                     except Book.DoesNotExist, e:
123                         if file_name not in postponed or postponed[file_name] < files_imported:
124                             # push it back into the queue, maybe the missing child will show up
125                             if verbose:
126                                 print self.style.NOTICE('Waiting for missing children')
127                             files.append(file_name)
128                             postponed[file_name] = files_imported
129                         else:
130                             # we're in a loop, nothing's being imported - some child is really missing
131                             raise e
132
133         # Print results
134         print
135         print "Results: %d files imported, %d skipped, %d total." % (
136             files_imported, files_skipped, files_imported + files_skipped)
137         print
138
139         if wait_until:
140             print 'Waiting...'
141             try:
142                 time.sleep(wait_until - time.time())
143             except IOError:
144                 print "it's already too late"
145
146         transaction.commit()
147         transaction.leave_transaction_management()
148