X-Git-Url: https://git.mdrn.pl/redakcja.git/blobdiff_plain/64b40d8e431d74335d88551554cce94d1d2e07e6..723f0aeedb81b9aabb213d5e8b74653e73a9eb38:/apps/catalogue/management/commands/make_master.py diff --git a/apps/catalogue/management/commands/make_master.py b/apps/catalogue/management/commands/make_master.py index 5d907b90..b2622013 100644 --- a/apps/catalogue/management/commands/make_master.py +++ b/apps/catalogue/management/commands/make_master.py @@ -2,12 +2,15 @@ from django.core.management.base import BaseCommand from django.core.management.color import color_style +from django.utils.encoding import smart_unicode from catalogue.management.prompt import confirm from catalogue.models import Book from optparse import make_option from datetime import date import re from slughifi import slughifi +from lxml import etree +from librarian import WLURI dc_fixed = { @@ -16,11 +19,12 @@ dc_fixed = { 'rights_license': u'http://creativecommons.org/licenses/by-sa/3.0/', } +dc_namespaces = { "dc": "http://purl.org/dc/elements/1.1/" } class Command(BaseCommand): option_list = BaseCommand.option_list + ( - make_option('-s', '--slug', dest='slug', help="Slug for master module"), - make_option('-F', '--file', dest='slugs_file', help="file with child module slugs per line"), + make_option('-s', '--slug', dest='slug', help="Slug for master module (if empty will be generated from title)"), + make_option('-F', '--file', dest='slugs_file', help="file with child module titles per line"), make_option('-t', '--title', dest='title', default='', help="title of master module"), make_option('-l', '--level', dest='audience', default='', help='Audience level'), ) @@ -31,14 +35,54 @@ class Command(BaseCommand): return True return False + def adopt(self, child, master, typ_, audience_, commit_args): + fc = child[0] + txt = fc.materialize() + changed = False + try: + t = etree.fromstring(txt) + except etree.XMLSyntaxError, e: + print "cannot read xml in part: %s" % child.slug + print unicode(e) + return + wluri = WLURI(t.xpath("//dc:identifier.url", namespaces=dc_namespaces)[0].text) + typ = t.xpath("//dc:type", namespaces=dc_namespaces) + if not typ: + print "no type in DC, inserting under format" + fmt = t.xpath("//dc:format", namespaces=dc_namespaces) + container = fmt.getparent() + typ = etree.SubElement(container, etree.QName('dc', 'type')) + container.insert(typ, container.index(fmt)+1) + changed = True + else: + typ = typ[0] + if typ.text != typ_: + print "type is '%s', setting to '%s'" % (typ.text, typ_) + changed = True + typ.text = typ_ + #audience = t.xpath("//dc:audience", namespaces=dc_namespaces)[0] + #if audience.text != audience_: + # print "audience is '%s', setting to '%s'" % (audience.text, audience_) + # changed = True + # audience.text = audience_ + if changed: + print "will commit." + fc.commit(etree.tostring(t, encoding=unicode), **commit_args) + return wluri + + def gen_xml(self, options, synthetic_modules=[], course_modules=[], project_modules=[]): holder = {} holder['xml'] = u"" + slug = options['slug'] + if not slug: + slug = slughifi(options['title']) def p(t): holder['xml'] += u"%s\n" % t def dc(k, v): + v = smart_unicode(v) p(u'%s' % (k, v, k)) def t(tag, ct): @@ -52,12 +96,12 @@ class Command(BaseCommand): p(u'') dc(u'title', options['title']) - for slug in synthetic_modules: - dc(u'relation.hasChild.synthetic', slug_url(slug)) - for slug in course_modules: - dc(u'relation.hasChild.course', slug_url(slug)) - for slug in project_modules: - dc(u'relation.hasChild.project', slug_url(slug)) + for s in synthetic_modules: + dc(u'relation.hasPart', unicode(s)) + for s in course_modules: + dc(u'relation.hasPart', unicode(s)) + for s in project_modules: + dc(u'relation.hasPart', unicode(s)) dc(u'publisher', u'Fundacja Nowoczesna Polska') # dc(u'subject.competence', meta.get(u'Wybrana kompetencja z Katalogu', u'')) # dc(u'subject.curriculum', meta.get(u'Odniesienie do podstawy programowej', u'')) @@ -65,13 +109,12 @@ class Command(BaseCommand): ## keyword = keyword.strip() ## dc(u'subject', keyword) dc(u'description', dc_fixed['description']) - dc(u'identifier.url', u'http://edukacjamedialna.edu.pl/%s' % options['slug']) + dc(u'identifier.url', u'http://edukacjamedialna.edu.pl/%s' % slug) dc(u'rights', dc_fixed['rights']) dc(u'rights.license', dc_fixed['rights_license']) - dc(u'format', u'synthetic, course, project') - dc(u'type', u'text') + dc(u'format', u'xml') + dc(u'type', u'section') dc(u'date', date.strftime(date.today(), "%Y-%m-%d")) - dc(u'audience', options['audience']) dc(u'language', u'pol') p(u'') p(u'') @@ -121,14 +164,16 @@ class Command(BaseCommand): print "Book for title %s does not exist" % t continue if self.looks_like_synthetic(t): - synthetic_modules.append(b.slug) + wlurl = self.adopt(b, master, 'synthetic', options['audience'], commit_args) + synthetic_modules.append(wlurl) else: - course_modules.append(b.slug) + wlurl = self.adopt(b, master, 'course', options['audience'], commit_args) + course_modules.append(wlurl) except Exception, e: print "Error getting slug list (file %s): %s" % (options['slugs_file'], e) - print "synthetic: %s" % synthetic_modules - print "course: %s" % course_modules + print "synthetic: %s" % [unicode(z) for z in synthetic_modules] + print "course: %s" % [unicode(z) for z in course_modules] xml = self.gen_xml(options, synthetic_modules, course_modules) c = master[0]