X-Git-Url: https://git.mdrn.pl/librarian.git/blobdiff_plain/d0475d381f12b2c89c7c514c4f7f7d2ebc421d0a..482477cced586463d7f342cdde8482a4d97d7685:/librarian/pypdf.py diff --git a/librarian/pypdf.py b/librarian/pypdf.py index bb2881f..6aadbc4 100644 --- a/librarian/pypdf.py +++ b/librarian/pypdf.py @@ -18,8 +18,7 @@ from urllib2 import urlopen from lxml import etree -from xmlutils import Xmill, tag, tagged, ifoption, tag_open_close -from librarian.dcparser import Person +from xmlutils import Xmill, ifoption, tag_open_close from librarian import DCNS, get_resource, IOFile from librarian import functions from pdf import PDFFormat, substitute_hyphens, fix_hanging @@ -30,10 +29,11 @@ def escape(really): def _wrap(*args, **kw): value = f(*args, **kw) - prefix = (u'' % (really and 1 or 0)) + prefix = (u'' % (1 if really else 0)) postfix = u'' if isinstance(value, list): - import pdb; pdb.set_trace() + import pdb + pdb.set_trace() if isinstance(value, tuple): return prefix + value[0], value[1] + postfix else: @@ -83,20 +83,19 @@ class EduModule(Xmill): def get_dc(self, element, dc_field, single=False): values = map(lambda t: t.text, element.xpath("//dc:%s" % dc_field, namespaces={'dc': DCNS.uri})) if single: - return values[0] + return values[0] if len(values) else '' return values def handle_rdf__RDF(self, _): - "skip metadata in generation" + """skip metadata in generation""" return @escape(True) def get_rightsinfo(self, element): rights_lic = self.get_dc(element, 'rights.license', True) - return u'' + \ - (rights_lic and u'%s' % rights_lic or '') +\ - u'%s' % self.get_dc(element, 'rights', True) +\ - u'' + return u'' + (u'%s' % rights_lic if rights_lic else '') + \ + u'%s' % self.get_dc(element, 'rights', True) + \ + u'' @escape(True) def get_authors(self, element, which=None): @@ -109,90 +108,124 @@ class EduModule(Xmill): authors = getattr(dc, "authors_%s" % which) return u', '.join(author.readable() for author in authors if author) - @escape(1) + @escape(True) def get_title(self, element): return self.get_dc(element, 'title', True) + @escape(True) + def get_description(self, element): + desc = self.get_dc(element, 'description', single=True) + if not desc: + print '!! no description' + return desc + + @escape(True) + def get_curriculum(self, element): + ret = [] + for dc_tag, new in [('subject.curriculum', False), ('subject.curriculum.new', True)]: + identifiers = self.get_dc(element, dc_tag) + if not identifiers: + continue + try: + from curriculum.templatetags.curriculum_tags import curriculum + curr_elements = curriculum(identifiers) + except ImportError: + curr_elements = {'identifiers': identifiers} + items = ['Nowa podstawa programowa:' if new else 'Podstawa programowa:'] + newline = '\n' + if 'currset' in curr_elements: + for (course, level), types in curr_elements['currset'].iteritems(): + label = u'klasa' if new else u'poziom edukacyjny' + lines = [u'%s, %s %s' % (course, level, label)] + for type, currs in types.iteritems(): + lines.append(type) + lines += [curr.title for curr in currs] + items.append(newline.join(lines)) + else: + items += identifiers + ret.append('\n.6em\n'.join( + '%s' % item for item in items)) + return '\n1em\n'.join(ret) + def handle_utwor(self, element): lines = [ u''' - - - \\documentclass[%s]{wl} - \\usepackage{style}''' % self.options['customization_str'], - self.options['has_cover'] and '\usepackage{makecover}', - (self.options['morefloats'] == 'new' and '\usepackage[maxfloats=64]{morefloats}') or - (self.options['morefloats'] == 'old' and '\usepackage{morefloats}') or - (self.options['morefloats'] == 'none' and - u'''\\IfFileExists{morefloats.sty}{ - \\usepackage{morefloats} - }{}'''), - u'''\\def\\authors{%s}''' % self.get_authors(element), - u'''\\def\\authorsexpert{%s}''' % self.get_authors(element, 'expert'), - u'''\\def\\authorsscenario{%s}''' % self.get_authors(element, 'scenario'), - u'''\\def\\authorstextbook{%s}''' % self.get_authors(element, 'textbook'), - - u'''\\author{\\authors}''', - u'''\\title{%s}''' % self.get_title(element), - u'''\\def\\bookurl{%s}''' % self.options['wldoc'].book_info.url.canonical(), - u'''\\def\\rightsinfo{%s}''' % self.get_rightsinfo(element), - u''] + + + \\documentclass[%s]{wl} + \\usepackage{style}''' % self.options['customization_str'], + self.options['has_cover'] and '\usepackage{makecover}', + (self.options['morefloats'] == 'new' and '\usepackage[maxfloats=64]{morefloats}') or + (self.options['morefloats'] == 'old' and '\usepackage{morefloats}') or + (self.options['morefloats'] == 'none' and + u'''\\IfFileExists{morefloats.sty}{ + \\usepackage{morefloats} + }{}'''), + u'''\\def\\authors{%s}''' % self.get_authors(element), + u'''\\def\\authorsexpert{%s}''' % self.get_authors(element, 'expert'), + u'''\\def\\authorsscenario{%s}''' % self.get_authors(element, 'scenario'), + u'''\\def\\authorstextbook{%s}''' % self.get_authors(element, 'textbook'), + u'''\\def\\description{%s}''' % self.get_description(element), + + u'''\\author{\\authors}''', + u'''\\title{%s}''' % self.get_title(element), + u'''\\def\\bookurl{%s}''' % self.options['wldoc'].book_info.url.canonical(), + u'''\\def\\rightsinfo{%s}''' % self.get_rightsinfo(element), + u'''\\def\\curriculum{%s}''' % self.get_curriculum(element), + u'' + ] return u"".join(filter(None, lines)), u'' - - @escape(1) + @escape(True) def handle_powiesc(self, element): return u""" """, """""" - @escape(1) + @escape(True) def handle_texcommand(self, element): cmd = functions.texcommand(element.tag) return u'' % cmd, u'' handle_akap = \ - handle_akap = \ - handle_akap_cd = \ - handle_akap_cd = \ - handle_akap_dialog = \ - handle_akap_dialog = \ - handle_autor_utworu = \ - handle_dedykacja = \ - handle_didaskalia = \ - handle_didask_tekst = \ - handle_dlugi_cytat = \ - handle_dzielo_nadrzedne = \ - handle_lista_osoba = \ - handle_mat = \ - handle_miejsce_czas = \ - handle_motto = \ - handle_motto_podpis = \ - handle_naglowek_akt = \ - handle_naglowek_czesc = \ - handle_naglowek_listy = \ - handle_naglowek_osoba = \ - handle_naglowek_scena = \ - handle_nazwa_utworu = \ - handle_nota = \ - handle_osoba = \ - handle_pa = \ - handle_pe = \ - handle_podtytul = \ - handle_poezja_cyt = \ - handle_pr = \ - handle_pt = \ - handle_sekcja_asterysk = \ - handle_sekcja_swiatlo = \ - handle_separator_linia = \ - handle_slowo_obce = \ - handle_srodtytul = \ - handle_tytul_dziela = \ - handle_wyroznienie = \ - handle_dywiz = \ - handle_texcommand + handle_akap_cd = \ + handle_akap_dialog = \ + handle_autor_utworu = \ + handle_dedykacja = \ + handle_didaskalia = \ + handle_didask_tekst = \ + handle_dlugi_cytat = \ + handle_dzielo_nadrzedne = \ + handle_lista_osoba = \ + handle_mat = \ + handle_miejsce_czas = \ + handle_motto = \ + handle_motto_podpis = \ + handle_naglowek_akt = \ + handle_naglowek_czesc = \ + handle_naglowek_listy = \ + handle_naglowek_osoba = \ + handle_naglowek_scena = \ + handle_nazwa_utworu = \ + handle_nota = \ + handle_osoba = \ + handle_pa = \ + handle_pe = \ + handle_podtytul = \ + handle_poezja_cyt = \ + handle_pr = \ + handle_pt = \ + handle_sekcja_asterysk = \ + handle_sekcja_swiatlo = \ + handle_separator_linia = \ + handle_slowo_obce = \ + handle_srodtytul = \ + handle_tytul_dziela = \ + handle_wyroznienie = \ + handle_dywiz = \ + handle_texcommand def handle_naglowek_rozdzial(self, element): if not self.options['teacher']: @@ -220,6 +253,7 @@ class EduModule(Xmill): def handle_uwaga(self, _e): return None + def handle_extra(self, _e): return None @@ -247,13 +281,16 @@ class EduModule(Xmill): opis = '' n = element.xpath('wskazowki') - if n: wskazowki = submill.generate(n[0]) - - else: wskazowki = '' + if n: + wskazowki = submill.generate(n[0]) + else: + wskazowki = '' n = element.xpath('pomoce') - if n: pomoce = submill.generate(n[0]) - else: pomoce = '' + if n: + pomoce = submill.generate(n[0]) + else: + pomoce = '' forma = ''.join(element.xpath('forma/text()')) @@ -261,7 +298,7 @@ class EduModule(Xmill): counter = self.activity_counter - if element.getnext().tag == 'aktywnosc' or (self.activity_last and self.activity_last.getnext() == element): + if element.getnext().tag == 'aktywnosc' or (len(self.activity_last) and self.activity_last.getnext() == element): counter_tex = """%(counter)d.""" % locals() else: counter_tex = '' @@ -296,7 +333,7 @@ class EduModule(Xmill): def handle_forma(self, *_): return - def handle_lista(self, element, attrs={}): + def handle_lista(self, element, attrs=None): ltype = element.attrib.get('typ', 'punkt') if not element.findall("punkt"): if ltype == 'czytelnia': @@ -309,13 +346,15 @@ class EduModule(Xmill): # print '** missing src on , setting default' surl = 'http://edukacjamedialna.edu.pl/lekcje/slowniczek/' sxml = etree.fromstring(self.options['wldoc'].provider.by_uri(surl).get_string()) - self.options = {'slowniczek': True, 'slowniczek_xml': sxml } + self.options = {'slowniczek': True, 'slowniczek_xml': sxml} - listcmd = {'num': 'enumerate', - 'punkt': 'itemize', - 'alfa': 'itemize', - 'slowniczek': 'itemize', - 'czytelnia': 'itemize'}[ltype] + listcmd = { + 'num': 'enumerate', + 'punkt': 'itemize', + 'alfa': 'itemize', + 'slowniczek': 'itemize', + 'czytelnia': 'itemize' + }[ltype] return u'' % listcmd, u'' @@ -334,7 +373,7 @@ class EduModule(Xmill): typ = element.attrib['typ'] self.exercise_counter += 1 - if not typ in exercise_handlers: + if typ not in exercise_handlers: return '(no handler)' self.options = {'exercise_counter': self.exercise_counter} handler = exercise_handlers[typ](self.options, self.state) @@ -376,20 +415,19 @@ class EduModule(Xmill): max_col = len(ks) self.options = {'columnts': max_col} # styling: - # has_frames = int(element.attrib.get("ramki", "0")) - # if has_frames: frames_c = "framed" - # else: frames_c = "" - # return u"""""" % frames_c, u"
" + # has_frames = int(element.attrib.get("ramki", "0")) + # if has_frames: frames_c = "framed" + # else: frames_c = "" + # return u"""""" % frames_c, u"
" return u''' tabular%s - ''' % ('l' * max_col), \ - u'''tabular''' + ''' % ('l' * max_col), u'''tabular''' - @escape(1) + @escape(True) def handle_wiersz(self, element): return u"", u'' - @escape(1) + @escape(True) def handle_kol(self, element): if element.getnext() is not None: return u"", u'' @@ -424,8 +462,7 @@ class EduModule(Xmill): print '!! unknown