X-Git-Url: https://git.mdrn.pl/librarian.git/blobdiff_plain/1e0f8d82649a23f695333d5ef4588e8b60afbe99..a3be479506edf42dc58feb22b26e4f5da1e49edd:/librarian/functions.py diff --git a/librarian/functions.py b/librarian/functions.py index 08f920d..b88a7fb 100644 --- a/librarian/functions.py +++ b/librarian/functions.py @@ -7,6 +7,7 @@ from lxml import etree import re from librarian.dcparser import Person +from librarian import get_resource def _register_function(f): """ Register extension function with lxml """ @@ -14,7 +15,7 @@ def _register_function(f): ns[f.__name__] = f -def reg_substitute_entities(): +def reg_substitute_entities(): ENTITY_SUBSTITUTIONS = [ (u'---', u'—'), (u'--', u'–'), @@ -102,5 +103,21 @@ def reg_texcommand(): text = ''.join(text) return re.sub(r'[^a-zA-Z]', '', text).strip() _register_function(texcommand) + +def reg_lang_code_3to2(): + def lang_code_3to2(context, text): + """Convert 3-letter language code to 2-letter code""" + result = '' + text = ''.join(text) + with open(get_resource('res/ISO-639-2_8859-1.txt'), 'rb') as f: + for line in f: + list = line.strip().split('|') + if list[0] == text: + result=list[2] + if result == '': + return text + else: + return result + _register_function(lang_code_3to2)