X-Git-Url: https://git.mdrn.pl/redakcja.git/blobdiff_plain/64b40d8e431d74335d88551554cce94d1d2e07e6..59f6e6616b1b01350f1eaa97ed026e8a8524da1f:/apps/catalogue/management/commands/make_master.py
diff --git a/apps/catalogue/management/commands/make_master.py b/apps/catalogue/management/commands/make_master.py
index 5d907b90..b2622013 100644
--- a/apps/catalogue/management/commands/make_master.py
+++ b/apps/catalogue/management/commands/make_master.py
@@ -2,12 +2,15 @@
from django.core.management.base import BaseCommand
from django.core.management.color import color_style
+from django.utils.encoding import smart_unicode
from catalogue.management.prompt import confirm
from catalogue.models import Book
from optparse import make_option
from datetime import date
import re
from slughifi import slughifi
+from lxml import etree
+from librarian import WLURI
dc_fixed = {
@@ -16,11 +19,12 @@ dc_fixed = {
'rights_license': u'http://creativecommons.org/licenses/by-sa/3.0/',
}
+# Prefix -> namespace-URI map passed as ``namespaces=`` to the xpath() calls
+# below so that the "dc:" prefix in the queries resolves to Dublin Core.
+dc_namespaces = {
+    "dc": "http://purl.org/dc/elements/1.1/",
+}
class Command(BaseCommand):
option_list = BaseCommand.option_list + (
- make_option('-s', '--slug', dest='slug', help="Slug for master module"),
- make_option('-F', '--file', dest='slugs_file', help="file with child module slugs per line"),
+ make_option('-s', '--slug', dest='slug', help="Slug for master module (if empty will be generated from title)"),
+ make_option('-F', '--file', dest='slugs_file', help="file with child module titles per line"),
make_option('-t', '--title', dest='title', default='', help="title of master module"),
make_option('-l', '--level', dest='audience', default='', help='Audience level'),
)
@@ -31,14 +35,54 @@ class Command(BaseCommand):
return True
return False
+    def adopt(self, child, master, typ_, audience_, commit_args):
+        """Ensure the child's Dublin Core metadata declares dc:type == typ_.
+
+        Parses the XML obtained from ``child[0].materialize()``, sets the
+        text of its dc:type element to ``typ_`` (creating the element right
+        after dc:format when it is missing) and commits the document back
+        through ``child[0].commit(...)`` only if something actually changed.
+
+        child       -- indexable object with a ``slug``; ``child[0]`` must
+                       offer ``materialize()`` and ``commit()`` (presumably
+                       a Book and its first chunk -- confirm against models)
+        master      -- accepted for the caller's convenience, unused here
+        typ_        -- text the dc:type element should end up with
+        audience_   -- unused; audience synchronisation is disabled
+        commit_args -- dict of keyword arguments forwarded to ``commit()``
+
+        Returns the WLURI built from the document's dc:identifier.url, or
+        None when the XML cannot be parsed. Raises ValueError when the
+        document has no dc:identifier.url element.
+        """
+        fc = child[0]
+        txt = fc.materialize()
+        try:
+            t = etree.fromstring(txt)
+        except etree.XMLSyntaxError as e:
+            print "cannot read xml in part: %s" % child.slug
+            print unicode(e)
+            return None
+
+        identifiers = t.xpath("//dc:identifier.url", namespaces=dc_namespaces)
+        if not identifiers:
+            # Fail with context instead of a bare IndexError on [0].
+            raise ValueError("no dc:identifier.url in part: %s" % child.slug)
+        wluri = WLURI(identifiers[0].text)
+
+        changed = False
+        found = t.xpath("//dc:type", namespaces=dc_namespaces)
+        if found:
+            typ = found[0]
+        else:
+            print "no type in DC, inserting under format"
+            formats = t.xpath("//dc:format", namespaces=dc_namespaces)
+            # xpath() returns a list, so pick the element itself; when there
+            # is no dc:format either, place the new element after the
+            # identifier, which is known to exist at this point.
+            anchor = formats[0] if formats else identifiers[0]
+            # QName takes the namespace URI, not the "dc" prefix. SubElement
+            # resolves the prefix from the parent's declarations; addnext()
+            # then moves the new element directly behind the anchor.
+            typ = etree.SubElement(
+                anchor.getparent(), etree.QName(dc_namespaces['dc'], 'type'))
+            anchor.addnext(typ)
+            changed = True
+
+        # Applies to a freshly inserted element too (its text is None).
+        if typ.text != typ_:
+            print "type is '%s', setting to '%s'" % (typ.text, typ_)
+            changed = True
+            typ.text = typ_
+
+        # NOTE: dc:audience used to be synchronised with audience_ here;
+        # that step is intentionally disabled.
+
+        if changed:
+            print "will commit."
+            fc.commit(etree.tostring(t, encoding=unicode), **commit_args)
+        return wluri
+
+
def gen_xml(self, options, synthetic_modules=[], course_modules=[], project_modules=[]):
holder = {}
holder['xml'] = u""
+ slug = options['slug']
+ if not slug:
+ slug = slughifi(options['title'])
def p(t):
holder['xml'] += u"%s\n" % t
def dc(k, v):
+ v = smart_unicode(v)
p(u'%s' % (k, v, k))
def t(tag, ct):
@@ -52,12 +96,12 @@ class Command(BaseCommand):
p(u'')
dc(u'title', options['title'])
- for slug in synthetic_modules:
- dc(u'relation.hasChild.synthetic', slug_url(slug))
- for slug in course_modules:
- dc(u'relation.hasChild.course', slug_url(slug))
- for slug in project_modules:
- dc(u'relation.hasChild.project', slug_url(slug))
+ for s in synthetic_modules:
+ dc(u'relation.hasPart', unicode(s))
+ for s in course_modules:
+ dc(u'relation.hasPart', unicode(s))
+ for s in project_modules:
+ dc(u'relation.hasPart', unicode(s))
dc(u'publisher', u'Fundacja Nowoczesna Polska')
# dc(u'subject.competence', meta.get(u'Wybrana kompetencja z Katalogu', u''))
# dc(u'subject.curriculum', meta.get(u'Odniesienie do podstawy programowej', u''))
@@ -65,13 +109,12 @@ class Command(BaseCommand):
## keyword = keyword.strip()
## dc(u'subject', keyword)
dc(u'description', dc_fixed['description'])
- dc(u'identifier.url', u'http://edukacjamedialna.edu.pl/%s' % options['slug'])
+ dc(u'identifier.url', u'http://edukacjamedialna.edu.pl/%s' % slug)
dc(u'rights', dc_fixed['rights'])
dc(u'rights.license', dc_fixed['rights_license'])
- dc(u'format', u'synthetic, course, project')
- dc(u'type', u'text')
+ dc(u'format', u'xml')
+ dc(u'type', u'section')
dc(u'date', date.strftime(date.today(), "%Y-%m-%d"))
- dc(u'audience', options['audience'])
dc(u'language', u'pol')
p(u'')
p(u'')
@@ -121,14 +164,16 @@ class Command(BaseCommand):
print "Book for title %s does not exist" % t
continue
if self.looks_like_synthetic(t):
- synthetic_modules.append(b.slug)
+ wlurl = self.adopt(b, master, 'synthetic', options['audience'], commit_args)
+ synthetic_modules.append(wlurl)
else:
- course_modules.append(b.slug)
+ wlurl = self.adopt(b, master, 'course', options['audience'], commit_args)
+ course_modules.append(wlurl)
except Exception, e:
print "Error getting slug list (file %s): %s" % (options['slugs_file'], e)
- print "synthetic: %s" % synthetic_modules
- print "course: %s" % course_modules
+ print "synthetic: %s" % [unicode(z) for z in synthetic_modules]
+ print "course: %s" % [unicode(z) for z in course_modules]
xml = self.gen_xml(options, synthetic_modules, course_modules)
c = master[0]