some epub/mobi fixes

[librarian.git] / librarian / mobi.py
diff --git a/librarian/mobi.py b/librarian/mobi.py

index 62b275c..cd894fe 100755 (executable)
--- a/librarian/mobi.py
+++ b/librarian/mobi.py
@@ -3,23 +3,15 @@
  # This file is part of Librarian, licensed under GNU Affero GPLv3 or later.
  # Copyright © Fundacja Nowoczesna Polska. See NOTICE for more information.
  #
-from __future__ import with_statement
-
  import os
  import os.path
  import subprocess
-from StringIO import StringIO
-from copy import deepcopy
-from lxml import etree
-import zipfile
  from tempfile import NamedTemporaryFile
-from shutil import rmtree
-
-import sys
-
-from librarian import epub
+from lxml import etree
  
-from librarian import functions, get_resource
+from librarian.cover import WLCover
+from librarian import epub, get_resource, NoDublinCore, RDFNS
+from librarian.dcparser import BookInfo
  
  
  def transform(provider, slug=None, file_path=None, output_file=None, output_dir=None, make_dir=False, verbose=False,
@@ -30,12 +22,29 @@ def transform(provider, slug=None, file_path=None, output_file=None, output_dir=
      slug: slug of file to process, available by provider
      output_file: path to output file
      output_dir: path to directory to save output file to; either this or output_file must be present
-    make_dir: writes output to <output_dir>/<author>/<slug>.epub instead of <output_dir>/<slug>.epub
+    make_dir: writes output to <output_dir>/<author>/<slug>.mobi instead of <output_dir>/<slug>.mobi
      sample=n: generate sample e-book (with at least n paragraphs)
      cover: a cover.Cover object
      flags: less-advertising,
      """
  
+    # read metadata from the first file
+    if file_path:
+        if slug:
+            raise ValueError('slug or file_path should be specified, not both')
+        f = open(file_path, 'r')
+        input_xml = etree.parse(f)
+        f.close()
+    else:
+        if not slug:
+            raise ValueError('either slug or file_path should be specified')
+        input_xml = etree.parse(provider[slug])
+
+    metadata = input_xml.find('.//'+RDFNS('Description'))
+    if metadata is None:
+        raise NoDublinCore('Document has no DublinCore - which is required.')
+    book_info = BookInfo.from_element(input_xml)
+
      # if output to dir, create the file
      if output_dir is not None:
          if make_dir:
@@ -50,11 +59,26 @@ def transform(provider, slug=None, file_path=None, output_file=None, output_dir=
          else:
              output_file = os.path.join(output_dir, os.path.splitext(os.path.basename(file_path))[0] + '.mobi')
  
+    # provide a cover by default
+    if not cover:
+        cover = WLCover
+    cover_file = NamedTemporaryFile(suffix='.png', delete=False)
+    c = cover(book_info.author.readable(), book_info.title)
+    c.save(cover_file)
+
      epub_file = NamedTemporaryFile(suffix='.epub', delete=False)
      if not flags:
          flags = []
      flags = list(flags) + ['without-fonts']
      epub.transform(provider, file_path=file_path, output_file=epub_file, verbose=verbose,
-              sample=sample, cover=None, flags=flags, style=get_resource('mobi/style.css'))
-    subprocess.check_call(['ebook-convert', epub_file.name, output_file])
+              sample=sample, html_toc=True, flags=flags, style=get_resource('mobi/style.css'))
+
+    if verbose:
+        kwargs = {}
+    else:
+        devnull = open("/dev/null", 'w')
+        kwargs = {"stdout": devnull, "stderr": devnull}
+    subprocess.check_call(['ebook-convert', epub_file.name, output_file,
+            '--no-inline-toc', '--cover=%s' % cover_file.name], **kwargs)
      os.unlink(epub_file.name)
+    os.unlink(cover_file.name)