Fix: manage.py importbooks -P means: don't build pdf.

[wolnelektury.git] / apps / catalogue / models.py
diff --git a/apps/catalogue/models.py b/apps/catalogue/models.py

index ead5ba0..930f98d 100644 (file)
--- a/apps/catalogue/models.py
+++ b/apps/catalogue/models.py
@@ -22,14 +22,14 @@ from django.conf import settings
  from newtagging.models import TagBase, tags_updated
  from newtagging import managers
  from catalogue.fields import JSONField, OverwritingFileField
  from newtagging.models import TagBase, tags_updated
  from newtagging import managers
  from catalogue.fields import JSONField, OverwritingFileField
-from catalogue.utils import ExistingFile
+from catalogue.utils import ExistingFile, BookImportDocProvider
  
  from librarian import dcparser, html, epub, NoDublinCore
  import mutagen
  from mutagen import id3
  from slughifi import slughifi
  from sortify import sortify
  
  from librarian import dcparser, html, epub, NoDublinCore
  import mutagen
  from mutagen import id3
  from slughifi import slughifi
  from sortify import sortify
-
+from os import unlink
  
  TAG_CATEGORIES = (
      ('author', _('author')),
  
  TAG_CATEGORIES = (
      ('author', _('author')),
@@ -51,6 +51,7 @@ MEDIA_FORMATS = (
  # not quite, but Django wants you to set a timeout
  CACHE_FOREVER = 2419200  # 28 days
  
  # not quite, but Django wants you to set a timeout
  CACHE_FOREVER = 2419200  # 28 days
  
+
  class TagSubcategoryManager(models.Manager):
      def __init__(self, subcategory):
          super(TagSubcategoryManager, self).__init__()
  class TagSubcategoryManager(models.Manager):
      def __init__(self, subcategory):
          super(TagSubcategoryManager, self).__init__()
@@ -295,9 +296,9 @@ class Book(models.Model):
      xml_file      = models.FileField(_('XML file'), upload_to=book_upload_path('xml'), blank=True)
      html_file     = models.FileField(_('HTML file'), upload_to=book_upload_path('html'), blank=True)
      pdf_file      = models.FileField(_('PDF file'), upload_to=book_upload_path('pdf'), blank=True)
      xml_file      = models.FileField(_('XML file'), upload_to=book_upload_path('xml'), blank=True)
      html_file     = models.FileField(_('HTML file'), upload_to=book_upload_path('html'), blank=True)
      pdf_file      = models.FileField(_('PDF file'), upload_to=book_upload_path('pdf'), blank=True)
-    epub_file     = models.FileField(_('EPUB file'), upload_to=book_upload_path('epub'), blank=True)    
-    txt_file      = models.FileField(_('TXT file'), upload_to=book_upload_path('txt'), blank=True)        
-
+    epub_file     = models.FileField(_('EPUB file'), upload_to=book_upload_path('epub'), blank=True)
+    txt_file      = models.FileField(_('TXT file'), upload_to=book_upload_path('txt'), blank=True)
+    
      parent        = models.ForeignKey('self', blank=True, null=True, related_name='children')
      objects  = models.Manager()
      tagged   = managers.ModelTaggedItemManager(Tag)
      parent        = models.ForeignKey('self', blank=True, null=True, related_name='children')
      objects  = models.Manager()
      tagged   = managers.ModelTaggedItemManager(Tag)
@@ -503,34 +504,49 @@ class Book(models.Model):
          return bool(self.has_media("ogg"))
      has_ogg_file.short_description = 'OGG'
      has_ogg_file.boolean = True
          return bool(self.has_media("ogg"))
      has_ogg_file.short_description = 'OGG'
      has_ogg_file.boolean = True
-    
+
      def has_daisy_file(self):
          return bool(self.has_media("daisy"))
      has_daisy_file.short_description = 'DAISY'
      def has_daisy_file(self):
          return bool(self.has_media("daisy"))
      has_daisy_file.short_description = 'DAISY'
-    has_daisy_file.boolean = True    
-    
+    has_daisy_file.boolean = True
+
+    def build_pdf(self):
+        """ (Re)builds the pdf file.
+
+            Renders this book's XML source with librarian's pdf.transform
+            into a temporary file, saves the result to `pdf_file` as
+            '<slug>.pdf' and always removes the temporary file afterwards.
+            A librarian ParseError is printed to stdout instead of raised;
+            any other exception propagates to the caller.
+        """
+        from django.core.files import File
+        from librarian import pdf, ParseError
+        from tempfile import NamedTemporaryFile
+        import os
+
+        # Resolved before the temporary file exists, so a book without
+        # an XML file fails here without leaving anything behind.
+        xml_path = self.xml_file.path
+
+        # Created outside the try/finally: if creation itself fails there
+        # is nothing to unlink and no unbound name in the cleanup code.
+        pdf_file = NamedTemporaryFile(delete=False)
+        try:
+            try:
+                # presumably writes the rendered PDF into output_file
+                pdf.transform(BookImportDocProvider(self),
+                              file_path=str(xml_path),
+                              output_file=pdf_file,
+                              )
+            finally:
+                # Flush and release the handle before the file is re-read
+                # (closing an already closed file is a no-op).
+                pdf_file.close()
+
+            # PDF is binary data, so read it back in binary mode.
+            pdf_source = open(pdf_file.name, 'rb')
+            try:
+                self.pdf_file.save('%s.pdf' % self.slug, File(pdf_source))
+            finally:
+                pdf_source.close()
+        except ParseError as e:
+            print '%(file)s:%(name)s:%(message)s; use -v to see more output' % {
+                'file': xml_path,
+                'name': e.__class__.__name__,
+                'message': e
+                }
+        finally:
+            # delete=False means the temporary file is ours to remove.
+            os.unlink(pdf_file.name)
+
+
      def build_epub(self, remove_descendants=True):
          """ (Re)builds the epub file.
              If book has a parent, does nothing.
              Unless remove_descendants is False, descendants' epubs are removed.
          """
      def build_epub(self, remove_descendants=True):
          """ (Re)builds the epub file.
              If book has a parent, does nothing.
              Unless remove_descendants is False, descendants' epubs are removed.
          """
-    
          from StringIO import StringIO
          from hashlib import sha1
          from django.core.files.base import ContentFile
          from StringIO import StringIO
          from hashlib import sha1
          from django.core.files.base import ContentFile
-        from librarian import DocProvider
-
-        class BookImportDocProvider(DocProvider):
-            """ used for joined EPUBs """
-
-            def __init__(self, book):
-                self.book = book
-
-            def by_slug(self, slug):
-                if slug == self.book.slug:
-                    return self.book.xml_file
-                else:
-                    return Book.objects.get(slug=slug).xml_file
  
          if self.parent:
              # don't need an epub
  
          if self.parent:
              # don't need an epub
@@ -633,7 +649,7 @@ class Book(models.Model):
              xml_file.close()
  
      @classmethod
              xml_file.close()
  
      @classmethod
-    def from_text_and_meta(cls, raw_file, book_info, overwrite=False, build_epub=True, build_txt=True):
+    def from_text_and_meta(cls, raw_file, book_info, overwrite=False, build_epub=True, build_txt=True, build_pdf=True):
          import re
  
          # check for parts before we do anything
          import re
  
          # check for parts before we do anything
@@ -706,6 +722,9 @@ class Book(models.Model):
          if not settings.NO_BUILD_EPUB and build_epub:
              book.root_ancestor.build_epub()
  
          if not settings.NO_BUILD_EPUB and build_epub:
              book.root_ancestor.build_epub()
  
+        if not settings.NO_BUILD_PDF and build_pdf:
+            book.root_ancestor.build_pdf()
+
          book_descendants = list(book.children.all())
          # add l-tag to descendants and their fragments
          # delete unnecessary EPUB files
          book_descendants = list(book.children.all())
          # add l-tag to descendants and their fragments
          # delete unnecessary EPUB files