1 # -*- coding: utf-8 -*-
3 # This file is part of Librarian, licensed under GNU Affero GPLv3 or later.
4 # Copyright © Fundacja Nowoczesna Polska. See NOTICE for more information.
6 from librarian import dcparser
8 from nose.tools import *
9 from os.path import splitext
10 from tests.utils import get_all_fixtures
12 from datetime import date
def check_dcparser(xml_file, result_file):
    """Check that parsing ``xml_file`` gives the metadata stored in ``result_file``.

    ``xml_file`` is parsed with ``dcparser.BookInfo.from_string`` and converted
    with ``to_dict()``.  ``result_file`` is read as UTF-8 text and evaluated as
    a Python expression producing the expected dict.  Every key of the
    expected dict is compared against the parsed metadata.
    """
    # Read the document as raw bytes and close both files deterministically;
    # the handles used to be left for the garbage collector to clean up.
    with open(xml_file, 'rb') as xml_handle:
        xml = xml_handle.read()
    with codecs.open(result_file, encoding='utf-8') as result_handle:
        result = result_handle.read()

    info = dcparser.BookInfo.from_string(xml).to_dict()

    # NOTE(review): eval() executes the fixture content as Python code.  That
    # is presumably fine for fixtures shipped with the project, but it must
    # never be pointed at files from an untrusted source.
    should_be = eval(result)

    for key in should_be:
        assert_equals(info[key], should_be[key])
def test_dcparser():
    """Yield one ``check_dcparser`` case per fixture.

    Iterates over whatever ``get_all_fixtures('dcparser', '*.xml')`` returns
    and pairs each fixture with the ``.out`` file sharing its base name.
    """
    # ``yield`` is only legal inside a function, so the loop has to live in a
    # generator that the test runner can iterate.
    for fixture in get_all_fixtures('dcparser', '*.xml'):
        base_name = splitext(fixture)[0]
        yield check_dcparser, fixture, base_name + '.out'
def check_serialize(xml_file):
    """Check that a ``BookInfo`` survives a serialize/parse round trip.

    The file is parsed with ``dcparser.BookInfo.from_string``, serialized via
    ``to_etree()`` and ``etree.tostring``, encoded as UTF-8 and parsed again.
    Every instance attribute found on either object must compare equal on
    both.
    """
    # Read the document as raw bytes and close the file deterministically;
    # the handle used to be left for the garbage collector to clean up.
    with open(xml_file, 'rb') as xml_handle:
        xml = xml_handle.read()
    info = dcparser.BookInfo.from_string(xml)

    # Serialize to text, then encode so the parser gets a UTF-8 byte string.
    serialized = etree.tostring(info.to_etree(), encoding=unicode).encode('utf-8')

    # Parse the serialized form again.
    info_bis = dcparser.BookInfo.from_string(serialized)

    # Compare over the union of attribute names so that an attribute present
    # on only one side is still looked up on the other.  Sorting keeps the
    # order of comparisons (and thus the first reported failure) stable.
    for key in sorted(set(vars(info)) | set(vars(info_bis))):
        assert_equals(getattr(info, key), getattr(info_bis, key))
def test_serialize():
    """Yield one ``check_serialize`` case per fixture.

    Iterates over whatever ``get_all_fixtures('dcparser', '*.xml')`` returns.
    """
    # ``yield`` is only legal inside a function, so the loop has to live in a
    # generator that the test runner can iterate.
    for fixture in get_all_fixtures('dcparser', '*.xml'):
        yield check_serialize, fixture
def test_as_date():
    """Check ``dcparser.as_date`` on exact, partial and descriptive dates.

    Covers a full ISO date, a bare year, century-based phrases, and
    "after"/"circa"/range/turn-of-year forms; each is expected to collapse to
    a single ``datetime.date``.
    """
    # Exact date and bare year.  The day is written as ``3`` rather than
    # ``03``: a leading-zero literal is octal in Python 2 and a syntax error
    # in Python 3.
    assert_equals(dcparser.as_date(u"2010-10-03"), date(2010, 10, 3))
    assert_equals(dcparser.as_date(u"2011"), date(2011, 1, 1))

    # Century-based phrases.
    # NOTE(review): "XIX w." is the 19th century and "XVII w." the 17th, so
    # 1950 and 1720 look one century late -- confirm against
    # dcparser.as_date before changing either side.
    assert_equals(dcparser.as_date(u"2 poł. XIX w."), date(1950, 1, 1))
    assert_equals(dcparser.as_date(u"XVII w., l. 20"), date(1720, 1, 1))

    # "After", "circa", ranges and turn-of-year forms resolve to the first
    # year mentioned.
    assert_equals(dcparser.as_date(u"po 1460"), date(1460, 1, 1))
    assert_equals(dcparser.as_date(u"ok. 1813-1814"), date(1813, 1, 1))
    assert_equals(dcparser.as_date(u"ok.1876-ok.1886"), date(1876, 1, 1))
    assert_equals(dcparser.as_date(u"1893/1894"), date(1893, 1, 1))