fnp
/
librarian.git
/ blobdiff
commit
grep
author
committer
pickaxe
?
search:
re
summary
|
shortlog
|
log
|
commit
|
commitdiff
|
tree
raw
|
inline
| side by side
fix handling empty xml files
[librarian.git]
/
librarian
/
__init__.py
diff --git a/librarian/__init__.py b/librarian/__init__.py
index ca527f6..dbdad5b 100644
(file)
--- a/librarian/__init__.py
+++ b/librarian/__init__.py
@@ -1,18 +1,10 @@
# -*- coding: utf-8 -*-
#
# -*- coding: utf-8 -*-
#
-# Copyright © 2008,2009,2010 Fundacja Nowoczesna Polska
-#
# This file is part of Librarian, licensed under GNU Affero GPLv3 or later.
# This file is part of Librarian, licensed under GNU Affero GPLv3 or later.
-# For full license text see COPYING or <http://www.gnu.org/licenses/agpl.html>
-
+# Copyright © Fundacja Nowoczesna Polska. See NOTICE for more information.
+#
class ParseError(Exception):
class ParseError(Exception):
-
- def __init__(self, cause, message=None):
- self.cause = cause
- try:
- self.message = message or self.cause.message
- except:
- self.message = "No message."
+ pass
class ValidationError(Exception):
pass
class ValidationError(Exception):
pass
@@ -30,7 +22,7 @@ class XMLNamespace(object):
return '{%s}%s' % (self.uri, tag)
def __contains__(self, tag):
return '{%s}%s' % (self.uri, tag)
def __contains__(self, tag):
- return tag.startswith('{'+str(self)+'}')
+ return tag.startswith('{' + str(self) + '}')
def __repr__(self):
return 'XMLNamespace(%r)' % self.uri
def __repr__(self):
return 'XMLNamespace(%r)' % self.uri
@@ -57,7 +49,7 @@ import lxml.etree as etree
import dcparser
DEFAULT_BOOKINFO = dcparser.BookInfo(
import dcparser
DEFAULT_BOOKINFO = dcparser.BookInfo(
- { RDFNS('about'): u'http://wiki.wolnepodreczniki.pl/Lektury:Template'},\
+ { RDFNS('about'): u'http://wiki.wolnepodreczniki.pl/Lektury:Template'}, \
{ DCNS('creator'): [u'Some, Author'],
DCNS('title'): [u'Some Title'],
DCNS('subject.period'): [u'Unknown'],
{ DCNS('creator'): [u'Some, Author'],
DCNS('title'): [u'Some Title'],
DCNS('subject.period'): [u'Unknown'],
@@ -77,18 +69,18 @@ DEFAULT_BOOKINFO = dcparser.BookInfo(
[u"Domena publiczna - zm. [OPIS STANU PRAWNEGO TEKSTU]"] })
def xinclude_forURI(uri):
[u"Domena publiczna - zm. [OPIS STANU PRAWNEGO TEKSTU]"] })
def xinclude_forURI(uri):
- e = etree.Element(
XINS("include")
)
+ e = etree.Element(
XINS("include")
)
e.set("href", uri)
return etree.tostring(e, encoding=unicode)
e.set("href", uri)
return etree.tostring(e, encoding=unicode)
-
+
def wrap_text(ocrtext, creation_date, bookinfo=DEFAULT_BOOKINFO):
"""Wrap the text within the minimal XML structure with a DC template."""
bookinfo.created_at = creation_date
def wrap_text(ocrtext, creation_date, bookinfo=DEFAULT_BOOKINFO):
"""Wrap the text within the minimal XML structure with a DC template."""
bookinfo.created_at = creation_date
-
- dcstring = etree.tostring(bookinfo.to_etree(),\
+
+ dcstring = etree.tostring(bookinfo.to_etree(), \
method='xml', encoding=unicode, pretty_print=True)
method='xml', encoding=unicode, pretty_print=True)
- return u'<utwor>\n' + dcstring + u'\n<plain-text>\n' + ocrtext +\
+ return u'<utwor>\n' + dcstring + u'\n<plain-text>\n' + ocrtext + \
u'\n</plain-text>\n</utwor>';
u'\n</plain-text>\n</utwor>';