Filter menu items
[wolnelektury.git] / apps / catalogue / management / commands / importbooks.py
1 # -*- coding: utf-8 -*-
2 # This file is part of Wolnelektury, licensed under GNU Affero GPLv3 or later.
3 # Copyright © Fundacja Nowoczesna Polska. See NOTICE for more information.
4 #
5 import os
6 import sys
7 import time
8 from optparse import make_option
9 from django.conf import settings
10 from django.core.management.base import BaseCommand
11 from django.core.management.color import color_style
12 from django.core.files import File
13 from catalogue.utils import trim_query_log
14 from librarian.picture import ImageStore
15 from wolnelektury_core.management.profile import profile
16
17 from catalogue.models import Book
18 from picture.models import Picture
19
20 from search import Index
21
22
class Command(BaseCommand):
    """Management command that imports book or picture XML files.

    Every ``*.xml`` file found directly inside each given directory is
    imported as a book (default) or, with ``--picture``, as a picture.
    Each successful import is committed on its own.
    """

    option_list = BaseCommand.option_list + (
        make_option('-q', '--quiet', action='store_false', dest='verbose', default=True,
            help='Quiet mode: print a dot per parsed file instead of progress messages'),
        make_option('-f', '--force', action='store_true', dest='force', default=False,
            help='Overwrite works already in the catalogue'),
        make_option('-D', '--dont-build', dest='dont_build',
            metavar="FORMAT,...",
            help="Skip building specified formats"),
        make_option('-S', '--no-search-index', action='store_false', dest='search_index', default=True,
            help='Skip indexing imported works for search'),
        make_option('-w', '--wait-until', dest='wait_until', metavar='TIME',
            help='Wait until specified time (Y-M-D h:m:s)'),
        make_option('-p', '--picture', action='store_true', dest='import_picture', default=False,
            help='Import pictures'),
    )
    help = 'Imports books from the specified directories.'
    args = 'directory [directory ...]'

    def import_book(self, file_path, options):
        """Import one book XML file plus any ebook files lying next to it.

        For each format listed in ``Book.ebook_formats``, a file with the
        same base name as the XML file and that format as its extension is
        stored in the book's ``<format>_file`` field.

        :param file_path: path to the book's XML file
        :param options: command options; 'verbose', 'force' and
            'dont_build' are read
        :returns: the imported book
        """
        verbose = options.get('verbose')

        # --dont-build takes a comma-separated, case-insensitive format list.
        dont_build = options.get('dont_build')
        if dont_build:
            dont_build = dont_build.lower().split(',')
        else:
            dont_build = None

        file_base = os.path.splitext(file_path)[0]
        book = Book.from_xml_file(file_path, overwrite=options.get('force'),
                                  dont_build=dont_build,
                                  search_index_tags=False)

        for ebook_format in Book.ebook_formats:
            ebook_path = file_base + '.' + ebook_format
            if not os.path.isfile(ebook_path):
                continue
            # Ebook files are binary: read them as bytes and make sure the
            # handle is closed once the field has stored the content.
            with open(ebook_path, 'rb') as ebook_file:
                getattr(book, '%s_file' % ebook_format).save(
                    '%s.%s' % (book.slug, ebook_format),
                    File(ebook_file),
                    save=False)
            if verbose:
                print("Importing %s.%s" % (file_base, ebook_format))

        # The field saves above used save=False; persist them all at once.
        book.save()
        return book

    def import_picture(self, file_path, options, continue_on_error=True):
        """Import one picture XML file.

        Images are looked up through an ``ImageStore`` rooted at the
        directory containing the XML file.

        :param file_path: path to the picture's XML file
        :param options: command options; 'force' is read
        :param continue_on_error: when true, any import error is printed
            and ``None`` is returned; when false, the error propagates
        :returns: the imported picture, or ``None`` if the import failed
            and ``continue_on_error`` is true
        """
        try:
            image_store = ImageStore(os.path.dirname(file_path))
            picture = Picture.from_xml_file(
                file_path, image_store=image_store, overwrite=options.get('force'))
        except Exception as ex:
            if not continue_on_error:
                # Bare raise keeps the original traceback.
                raise
            print("%s: %s" % (file_path, ex))
            return None
        return picture

    # Uncomment to profile an import run:
    #    @profile
    def handle(self, *directories, **options):
        """Import every XML file from the given directories.

        A book whose import raises ``Book.DoesNotExist`` is pushed back to
        the end of the queue and retried later; if nothing new has been
        imported since it was last postponed, the exception is re-raised.

        :param directories: directories to scan (not recursively)
        :param options: parsed command-line options
        """
        from collections import deque
        from django.db import transaction

        self.style = color_style()

        verbose = options.get('verbose')
        import_picture = options.get('import_picture')

        wait_until = None
        if options.get('wait_until'):
            wait_until = time.mktime(
                time.strptime(options.get('wait_until'), '%Y-%m-%d %H:%M:%S'))
            if verbose:
                print("Will wait until %s; it's %f seconds from now" % (
                    time.strftime('%Y-%m-%d %H:%M:%S', time.localtime(wait_until)),
                    wait_until - time.time()))

        # Index tags up front; imported books are created with
        # search_index_tags=False.
        if options.get('search_index') and not settings.NO_SEARCH_INDEX:
            index = Index()
            try:
                index.index_tags()
                index.index.commit()
            except Exception:
                index.index.rollback()
                raise

        # Start transaction management.
        transaction.commit_unless_managed()
        transaction.enter_transaction_management()
        transaction.managed(True)

        files_imported = 0
        files_skipped = 0

        try:
            for dir_name in directories:
                if not os.path.isdir(dir_name):
                    print(self.style.ERROR("%s: Not a directory. Skipping." % dir_name))
                    continue

                # Files queue; postponed files are appended at the end.
                files = deque(sorted(os.listdir(dir_name)))
                # file name -> value of files_imported when it was postponed
                postponed = {}
                while files:
                    # NOTE(review): presumably keeps the debug query log
                    # from growing during a long run - confirm in
                    # catalogue.utils.
                    trim_query_log(0)
                    file_name = files.popleft()
                    file_path = os.path.join(dir_name, file_name)

                    # Skip files that are not XML files
                    if os.path.splitext(file_path)[1] != '.xml':
                        continue

                    if verbose:
                        print("Parsing '%s'" % file_path)
                    else:
                        sys.stdout.write('.')
                        sys.stdout.flush()

                    try:
                        if import_picture:
                            if self.import_picture(file_path, options) is None:
                                # The error was already reported by
                                # import_picture; discard partial changes
                                # and do not count the file as imported.
                                transaction.rollback()
                                files_skipped += 1
                                continue
                        else:
                            self.import_book(file_path, options)

                        files_imported += 1
                        transaction.commit()

                    except (Book.AlreadyExists, Picture.AlreadyExists):
                        print(self.style.ERROR('%s: Book or Picture already imported. Skipping. To overwrite use --force.' %
                            file_path))
                        files_skipped += 1

                    except Book.DoesNotExist:
                        if file_name not in postponed or postponed[file_name] < files_imported:
                            # push it back into the queue, maybe the missing child will show up
                            if verbose:
                                print(self.style.NOTICE('Waiting for missing children'))
                            files.append(file_name)
                            postponed[file_name] = files_imported
                        else:
                            # we're in a loop, nothing's being imported - some child is really missing
                            raise

            # Print results
            print('')
            print("Results: %d files imported, %d skipped, %d total." % (
                files_imported, files_skipped, files_imported + files_skipped))
            print('')

            if wait_until is not None:
                print('Waiting...')
                remaining = wait_until - time.time()
                if remaining < 0:
                    print("it's already too late")
                else:
                    time.sleep(remaining)

            transaction.commit()
        except BaseException:
            # Leave no pending changes behind; leaving a dirty managed
            # block would itself raise and hide the original error.
            transaction.rollback()
            raise
        finally:
            transaction.leave_transaction_management()