X-Git-Url: https://git.mdrn.pl/librarian.git/blobdiff_plain/773612b400fb85103153032b193b1434d136a7ef..9a04110484aaeb16d6b6865f86039aba7e5540e5:/librarian/pypdf.py
diff --git a/librarian/pypdf.py b/librarian/pypdf.py
index 4cc4d1d..6d6e0aa 100644
--- a/librarian/pypdf.py
+++ b/librarian/pypdf.py
@@ -10,20 +10,23 @@ with TeXML, then runs it by XeLaTeX.
"""
from __future__ import with_statement
+from copy import deepcopy
import os
import os.path
import shutil
from StringIO import StringIO
from tempfile import mkdtemp, NamedTemporaryFile
import re
+import random
from copy import deepcopy
from subprocess import call, PIPE
+from urllib2 import urlopen
from Texml.processor import process
from lxml import etree
from lxml.etree import XMLSyntaxError, XSLTApplyError
-from xmlutils import Xmill, tag, tagged, ifoption
+from xmlutils import Xmill, tag, tagged, ifoption, tag_open_close
from librarian.dcparser import Person
from librarian.parser import WLDocument
from librarian import ParseError, DCNS, get_resource, IOFile, Format
@@ -49,15 +52,21 @@ def escape(really):
return deco
-def cmd(name, pass_text=False):
- def wrap(self, element):
- pre = u'' % name
+def cmd(name, parms=None):
+ def wrap(self, element=None):
+ pre, post = tag_open_close('cmd', name=name)
- if pass_text:
- pre += "%s" % element.text
- return pre + ''
+ if parms:
+ for parm in parms:
+ e = etree.Element("parm")
+ e.text = parm
+ pre += etree.tostring(e)
+ if element is not None:
+ pre += ""
+ post = "" + post
+ return pre, post
else:
- return pre, ''
+ return pre + post
return wrap
@@ -74,7 +83,7 @@ class EduModule(Xmill):
def swap_endlines(txt):
if self.options['strofa']:
- txt = txt.replace("/\n", '')
+ txt = txt.replace("/\n", '')
return txt
self.register_text_filter(functions.substitute_entities)
self.register_text_filter(mark_alien_characters)
@@ -99,11 +108,15 @@ class EduModule(Xmill):
u''
@escape(True)
- def get_authors(self, element):
- authors = self.get_dc(element, 'creator.expert') + \
- self.get_dc(element, 'creator.scenario') + \
- self.get_dc(element, 'creator.textbook')
- return u', '.join(authors)
+ def get_authors(self, element, which=None):
+ dc = self.options['wldoc'].book_info
+ if which is None:
+ authors = dc.authors_textbook + \
+ dc.authors_scenario + \
+ dc.authors_expert
+ else:
+ authors = getattr(dc, "authors_%s" % which)
+ return u', '.join(author.readable() for author in authors)
@escape(1)
def get_title(self, element):
@@ -124,9 +137,13 @@ class EduModule(Xmill):
\\usepackage{morefloats}
}{}'''),
u'''\\def\\authors{%s}''' % self.get_authors(element),
+ u'''\\def\\authorsexpert{%s}''' % self.get_authors(element, 'expert'),
+ u'''\\def\\authorsscenario{%s}''' % self.get_authors(element, 'scenario'),
+ u'''\\def\\authorstextbook{%s}''' % self.get_authors(element, 'textbook'),
+
u'''\\author{\\authors}''',
u'''\\title{%s}''' % self.get_title(element),
- u'''\\def\\bookurl{%s}''' % self.get_dc(element, 'identifier.url', True),
+ u'''\\def\\bookurl{%s}''' % self.options['wldoc'].book_info.url.canonical(),
u'''\\def\\rightsinfo{%s}''' % self.get_rightsinfo(element),
u'']
@@ -138,7 +155,7 @@ class EduModule(Xmill):
return u"""
- """, """"""
+ """, """"""
@escape(1)
def handle_texcommand(self, element):
@@ -189,7 +206,7 @@ class EduModule(Xmill):
handle_wyroznienie = \
handle_texcommand
- _handle_strofa = cmd("strofa", True)
+ _handle_strofa = cmd("strofa")
def handle_strofa(self, element):
self.options = {'strofa': True}
@@ -222,7 +239,7 @@ class EduModule(Xmill):
counter = self.activity_counter
return u"""
-
+
%(counter)d.
%(czas)s
@@ -250,12 +267,17 @@ class EduModule(Xmill):
return
def handle_lista(self, element, attrs={}):
+ if not element.findall("punkt"):
+ return None
ltype = element.attrib.get('typ', 'punkt')
if ltype == 'slowniczek':
- surl = element.attrib.get('href', None)
+ surl = element.attrib.get('src', None)
+ if surl is None:
+ # print '** missing src on , setting default'
+ surl = 'http://edukacjamedialna.edu.pl/slowniczek'
sxml = None
if surl:
- sxml = etree.fromstring(self.options['provider'].by_uri(surl).get_string())
+ sxml = etree.fromstring(self.options['wldoc'].provider.by_uri(surl).get_string())
self.options = {'slowniczek': True, 'slowniczek_xml': sxml }
listcmd = {'num': 'enumerate',
@@ -271,16 +293,19 @@ class EduModule(Xmill):
def handle_cwiczenie(self, element):
exercise_handlers = {
- 'wybor': Wybor}
- # 'uporzadkuj': Uporzadkuj,
- # 'luki': Luki,
- # 'zastap': Zastap,
- # 'przyporzadkuj': Przyporzadkuj,
- # 'prawdafalsz': PrawdaFalsz
+ 'wybor': Wybor,
+ 'uporzadkuj': Uporzadkuj,
+ 'luki': Luki,
+ 'zastap': Zastap,
+ 'przyporzadkuj': Przyporzadkuj,
+ 'prawdafalsz': PrawdaFalsz
+ }
typ = element.attrib['typ']
+ self.exercise_counter += 1
if not typ in exercise_handlers:
return '(no handler)'
+ self.options = {'exercise_counter': self.exercise_counter}
handler = exercise_handlers[typ](self.options)
return handler.generate(element)
@@ -291,7 +316,7 @@ class EduModule(Xmill):
definiens_s = ''
# let's pull definiens from another document
- if self.options['slowniczek_xml'] and (not nxt or nxt.tag != 'definiens'):
+ if self.options['slowniczek_xml'] is not None and (nxt is None or nxt.tag != 'definiens'):
sxml = self.options['slowniczek_xml']
assert element.text != ''
defloc = sxml.xpath("//definiendum[text()='%s']" % element.text)
@@ -322,7 +347,7 @@ class EduModule(Xmill):
# else: frames_c = ""
# return u""""
return u'''
-tabular%s
+tabular%s
''' % ('l' * max_col), \
u'''tabular'''
@@ -333,10 +358,43 @@ class EduModule(Xmill):
@escape(1)
def handle_kol(self, element):
if element.getnext() is not None:
- return u"", u''
+ return u"", u''
return u"", u""
- handle_link = cmd('em', True)
+ def handle_link(self, element):
+ if element.attrib.get('url'):
+ url = element.attrib.get('url')
+ if url == element.text:
+ return cmd('url')(self, element)
+ else:
+ return cmd('href', parms=[element.attrib['url']])(self, element)
+ else:
+ return cmd('emph')(self, element)
+
+ def handle_obraz(self, element):
+ frmt = self.options['format']
+ name = element.attrib['nazwa'].strip()
+ image = frmt.get_image(name.strip())
+ img_path = "obraz/%s" % name.replace("_", "")
+ frmt.attachments[img_path] = image
+ return cmd("obraz", parms=[img_path])(self)
+
+ def handle_video(self, element):
+ url = element.attrib.get('url')
+ if not url:
+ print '!!