add vimeo

[librarian.git] / librarian / formats / epub / __init__.py
diff --git a/librarian/formats/epub/__init__.py b/librarian/formats/epub/__init__.py

index 708b063..4e2e6e5 100644 (file)
--- a/librarian/formats/epub/__init__.py
+++ b/librarian/formats/epub/__init__.py
@@ -4,6 +4,7 @@
  # Copyright © Fundacja Nowoczesna Polska. See NOTICE for more information.
  #
  import os
+import re
  import urllib
  from copy import deepcopy
  from mimetypes import guess_type
@@ -12,7 +13,7 @@ import zipfile
  from urllib2 import urlopen
  
  from lxml import etree
-from librarian import OPFNS, NCXNS, XHTMLNS, DCNS
+from librarian import OPFNS, NCXNS, XHTMLNS, DCNS, BuildError, VIDEO_PROVIDERS
  from librarian import core
  from librarian.formats import Format
  from librarian.formats.cover.evens import EvensCover
@@ -34,8 +35,11 @@ class EpubFormat(Format):
          if cover is not None:
              self.cover = cover
  
-    def dc(self, tag):
-        return self.doc.meta.get_one(DCNS(tag))
+    def dc(self, tag, multiple=False):
+        """Look up the metadata stored under the ``DCNS``-qualified ``tag``.
+
+        With ``multiple`` left false the result of ``meta.get_one`` is
+        returned as is.  With ``multiple`` true, everything ``meta.get``
+        yields for the tag is joined into one ``', '``-separated string.
+        """
+        meta = self.doc.meta
+        if not multiple:
+            return meta.get_one(DCNS(tag))
+        return ', '.join(meta.get(DCNS(tag)))
  
      def build(self, ctx=None):
  
@@ -157,7 +161,7 @@ class EpubFormat(Format):
              'Information about the resource',
              'Publisher: %s' % self.dc('publisher'),
              'Rights: %s' % self.dc('rights'),
-            'Intended audience: %s' % self.dc('audience'),
+            'Intended audience: %s' % self.dc('audience', multiple=True),
              self.dc('description'),
              'Resource prepared using MIL/PEER editing platform.',
              'Source available at %s' % ctx.source_url,
@@ -229,6 +233,24 @@ class EpubRenderer(TreeRenderer):
          yield wrapper
  
  
+class NaturalText(EpubRenderer):
+    """Renderer that glues one-letter words to the word that follows them.
+
+    A plain space that directly follows a single word character (itself
+    preceded by whitespace) is replaced with an ``nbsp`` entity node.
+    """
+
+    # Raw string so the backslash escapes reach the regex engine untouched;
+    # compiled once here instead of on every ``render_text`` call.
+    _orphan_space = re.compile(r'(?<=\s\w) ')
+
+    def render_text(self, text, ctx):
+        """Return the text container root, filled with ``text``.
+
+        ``text`` is cut at every space matched by ``_orphan_space``.  The
+        first piece becomes the inner element's text; each later piece is
+        attached as the tail of an ``nbsp`` entity appended to the inner
+        element.  ``ctx`` is not used here.
+        """
+        root, inner = self.text_container()
+        chunks = self._orphan_space.split(text)
+        inner.text = chunks[0]
+        for chunk in chunks[1:]:
+            # NOTE(review): the named entity ``nbsp`` is not predefined in
+            # plain XML -- confirm the generated XHTML declares it, or
+            # switch to the numeric form.
+            nbsp = etree.Entity("nbsp")
+            nbsp.tail = chunk
+            inner.append(nbsp)
+        return root
+
+
+class Silent(EpubRenderer):
+    """Renderer that leaves text out: the text container is returned unfilled."""
+
+    def render_text(self, text, ctx):
+        """Return the root of the text container, ignoring ``text`` and ``ctx``."""
+        container = self.text_container()
+        root, _unused_inner = container
+        return root
+
+
  class Footnotes(object):
      def __init__(self):
          self.counter = 0
@@ -290,7 +312,7 @@ class TOC(object):
  
  # Renderers
  
-class AsideR(EpubRenderer):
+class AsideR(NaturalText):
      def render(self, element, ctx):
          outputs = list(super(AsideR, self).render(element, ctx))
          anchor = ctx.footnotes.append(outputs)
@@ -299,8 +321,10 @@ class AsideR(EpubRenderer):
          yield wrapper
  EpubFormat.renderers.register(core.Aside, None, AsideR('div'))
  
+EpubFormat.renderers.register(core.Aside, 'comment', Silent())
  
-class DivR(EpubRenderer):
+
+class DivR(NaturalText):
      def container(self, ctx):
          root, inner = super(DivR, self).container(ctx)
          if getattr(ctx, 'inline', False):
@@ -308,12 +332,20 @@ class DivR(EpubRenderer):
              inner.set('style', 'display: block;')
          return root, inner
  EpubFormat.renderers.register(core.Div, None, DivR('div'))
+EpubFormat.renderers.register(core.Div, 'p', NaturalText('p'))
+
+EpubFormat.renderers.register(core.Div, 'list', NaturalText('ul'))
+EpubFormat.renderers.register(core.Div, 'list.enum', NaturalText('ol'))
+EpubFormat.renderers.register(core.Div, 'item', NaturalText('li'))
+EpubFormat.renderers.register(core.Span, 'item', NaturalText('li'))
  
  
  class DivImageR(EpubRenderer):
      def render(self, element, ctx):
          src = element.attrib.get('src', '')
          ctx.images.append(src)
+        if '/' not in src:
+            raise BuildError('Bad image URL')
          src = src.rsplit('/', 1)[1]
          return super(DivImageR, self).render(element, Context(ctx, src=src))
  
@@ -326,13 +358,28 @@ class DivImageR(EpubRenderer):
  EpubFormat.renderers.register(core.Div, 'img', DivImageR('img'))
  
  
-class HeaderR(EpubRenderer):
+class DivVideoR(Silent):
+    """Render a video div as a container holding a plain link to the video.
+
+    The link target is built from the ``url`` template that
+    ``VIDEO_PROVIDERS`` holds for the element's ``provider`` attribute.
+    """
+
+    def render(self, element, ctx):
+        """Resolve the video URL and render with it exposed as ``ctx.src``.
+
+        Raises ``BuildError`` when the ``provider`` attribute is missing or
+        is not a key of ``VIDEO_PROVIDERS``, matching how a bad image URL is
+        reported, instead of leaking a bare ``KeyError``.
+        """
+        provider = element.attrib.get('provider')
+        if provider not in VIDEO_PROVIDERS:
+            raise BuildError('Unknown video provider: %s' % provider)
+        video_id = element.attrib.get('videoid', '')
+        src = VIDEO_PROVIDERS[provider]['url'] % video_id
+        return super(DivVideoR, self).render(element, Context(ctx, src=src))
+
+    def container(self, ctx):
+        """Return the inherited container with an ``<a>`` link appended.
+
+        The link's ``href`` and its visible text are both ``ctx.src``
+        (an empty string when the context carries no ``src``).
+        """
+        root, inner = super(DivVideoR, self).container(ctx)
+        src = getattr(ctx, 'src', '')
+        link = etree.Element('a', {'href': src})
+        link.text = src
+        inner.append(link)
+        return root, inner
+EpubFormat.renderers.register(core.Div, 'video', DivVideoR('p'))
+
+
+class HeaderR(NaturalText):
      def subcontext(self, element, ctx):
          return Context(ctx, inline=True)
  EpubFormat.renderers.register(core.Header, None, HeaderR('h1'))
  
  
-class SectionR(EpubRenderer):
+class SectionR(NaturalText):
      epub_separate = True
  
      def render(self, element, ctx):
@@ -344,6 +391,21 @@ class SectionR(EpubRenderer):
  EpubFormat.renderers.register(core.Section, None, SectionR())
  
  
-class SpanR(EpubRenderer):
+class SpanR(NaturalText):
      pass
  EpubFormat.renderers.register(core.Span, None, SpanR('span'))
+EpubFormat.renderers.register(core.Span, 'cite', SpanR('i'))
+EpubFormat.renderers.register(core.Span, 'emp', SpanR('b'))
+EpubFormat.renderers.register(core.Span, 'emph', SpanR('i'))
+
+
+class SpanLink(EpubRenderer):
+    """Renderer that copies the source element's ``href`` onto its output."""
+
+    def render(self, element, ctx):
+        """Yield each inherited output part with ``href`` set on ``part[0]``.
+
+        An ``href`` starting with ``file://`` has that prefix replaced by
+        ``ctx.files_path``; any other value (or ``''`` when the attribute
+        is absent) is used unchanged.
+        """
+        file_prefix = 'file://'
+        # The target depends only on ``element`` and ``ctx``, so resolve it
+        # once rather than again for every yielded part.
+        src = element.attrib.get('href', '')
+        if src.startswith(file_prefix):
+            src = ctx.files_path + src[len(file_prefix):]
+        for part in super(SpanLink, self).render(element, ctx):
+            part[0].attrib['href'] = src
+            yield part
+EpubFormat.renderers.register(core.Span, 'link', SpanLink('a'))