X-Git-Url: https://git.mdrn.pl/librarian.git/blobdiff_plain/1ce2c1255aee01fab9940fc26d251767bbf8c960..a2f8ee881d66601e9cb714069dc88d3ed9703db6:/librarian/pdf.py diff --git a/librarian/pdf.py b/librarian/pdf.py index 07272f2..f8a4d73 100644 --- a/librarian/pdf.py +++ b/librarian/pdf.py @@ -21,7 +21,7 @@ from lxml.etree import XMLSyntaxError, XSLTApplyError from librarian.dcparser import Person from librarian.parser import WLDocument -from librarian import ParseError, DCNS +from librarian import ParseError, DCNS, get_resource from librarian import functions @@ -32,7 +32,7 @@ functions.reg_ends_white() functions.reg_texcommand() STYLESHEETS = { - 'wl2tex': 'xslt/wl2tex.xslt', + 'wl2tex': 'pdf/wl2tex.xslt', } @@ -128,18 +128,17 @@ def hack_motifs(doc): def parse_creator(doc): - """ find all dc:creator tags and add dc:creator_parsed with forenames first """ - for creator in doc.findall('//'+DCNS('creator')): - p = Person.from_text(creator.text) - creator_parsed = deepcopy(creator) - creator_parsed.tag = DCNS('creator_parsed') - creator_parsed.text = ' '.join(p.first_names + (p.last_name,)) - creator.getparent().insert(0, creator_parsed) + """ find all dc:creator and dc.contributor tags and add *_parsed versions with forenames first """ + for person in doc.xpath("|".join('//dc:'+(tag) for tag in ( + 'creator', 'contributor.translator', 'contributor.editor', 'contributor.technical_editor')), + namespaces = {'dc': str(DCNS)})[::-1]: + p = Person.from_text(person.text) + person_parsed = deepcopy(person) + person_parsed.tag = person.tag + '_parsed' + person_parsed.text = p.readable() + person.getparent().insert(0, person_parsed) -def get_resource(path): - return os.path.join(os.path.dirname(__file__), path) - def get_stylesheet(name): return get_resource(STYLESHEETS[name]) @@ -227,7 +226,7 @@ def transform(provider, slug=None, file_path=None, # LaTeX -> PDF shutil.copy(get_resource('pdf/wl.sty'), temp) - shutil.copy(get_resource('pdf/wl-logo.png'), temp) + shutil.copy(get_resource('res/wl-logo.png'), temp) cwd = os.getcwd() os.chdir(temp) @@ -289,9 +288,9 @@ def load_including_children(provider, slug=None, uri=None, file_path=None): parse_dublincore=True) f.close() - + print document.book_info for child_uri in document.book_info.parts: + print child_uri child = load_including_children(provider, uri=child_uri) document.edoc.getroot().append(child.edoc.getroot()) - return document