X-Git-Url: https://git.mdrn.pl/librarian.git/blobdiff_plain/5fed78856949474a36bc5e268517775a9a802e27..00906f2fc0432cede204c7870e6caecf427d7024:/librarian/dcparser.py diff --git a/librarian/dcparser.py b/librarian/dcparser.py index d99aaf0..fff8ac2 100644 --- a/librarian/dcparser.py +++ b/librarian/dcparser.py @@ -6,6 +6,8 @@ from xml.parsers.expat import ExpatError from datetime import date import time +import re +from librarian.util import roman_to_int from librarian import (ValidationError, NoDublinCore, ParseError, DCNS, RDFNS, WLURI) @@ -62,10 +64,17 @@ class Person(object): def as_date(text): try: - try: - t = time.strptime(text, '%Y-%m-%d') - except ValueError: - t = time.strptime(text, '%Y') + # check out the "N. poł X w." syntax + m = re.match(u"([12]) *poł[.]? ([MCDXVI]+) .*[.]?", text) + if m: + half = int(m.groups()[0]) + century = roman_to_int(str(m.groups()[1])) + t = ((century*100 + (half-1)*50), 1, 1) + else: + try: + t = time.strptime(text, '%Y-%m-%d') + except ValueError: + t = time.strptime(text, '%Y') return date(t[0], t[1], t[2]) except ValueError, e: raise ValueError("Unrecognized date format. Try YYYY-MM-DD or YYYY.")