-def hyphenate_and_fix_conjunctions(source_tree):
- """ hyphenate only powiesc, opowiadanie and wywiad tag"""
- texts = etree.XPath('//*[self::powiesc|self::opowiadanie|self::wywiad]//text()')(source_tree)
+def squeeze_whitespace(s):
+    """Return the byte string *s* with each whitespace run replaced by one space."""
+    # The pattern is a bytes pattern, so *s* has to be a bytes-like object.
+    whitespace_run = re.compile(b'\\s+')
+    return whitespace_run.sub(b' ', s)
+
+
+def set_hyph_language(source_tree):
+    """Build a hyphenator for the language declared in *source_tree*.
+
+    The first ``dc:language`` text node of the tree is looked up in
+    ``res/ISO-639-2_8859-1.txt`` and the resulting code selects the
+    dictionary ``res/hyph-dictionaries/hyph_<code>.dic``.
+
+    Returns a ``Hyphenator`` instance, or ``None`` when the document
+    declares no language or the dictionary cannot be loaded.
+    """
+    def get_short_lng_code(text):
+        """Map *text* to the third ``|``-separated field of its table row.
+
+        A row matches when its first field equals *text*; presumably the
+        first field is the three-letter code and the third the two-letter
+        one -- TODO confirm against the resource file. When no row matches,
+        or the matching row has an empty third field, *text* is returned
+        unchanged.
+        """
+        # join() accepts either a single string or a list of text fragments.
+        text = ''.join(text)
+        short_code = ''
+        with open(get_resource('res/ISO-639-2_8859-1.txt'), 'rb') as f:
+            for line in f.read().decode('latin1').split('\n'):
+                fields = line.strip().split('|')
+                # Skip blank or malformed rows instead of failing on them.
+                if len(fields) > 2 and fields[0] == text:
+                    short_code = fields[2]
+        return short_code or text
+
+    bibl_lng = etree.XPath('//dc:language//text()',
+                           namespaces={'dc': str(DCNS)})(source_tree)
+    if not bibl_lng:
+        # No language declared: nothing to pick a dictionary by.
+        return None
+    short_lng = get_short_lng_code(bibl_lng[0])
+    try:
+        return Hyphenator(get_resource('res/hyph-dictionaries/hyph_' +
+                                       short_lng + '.dic'))
+    except Exception:
+        # Best effort: a missing or unusable dictionary disables
+        # hyphenation rather than aborting, but interpreter-exit signals
+        # (KeyboardInterrupt, SystemExit) are no longer swallowed.
+        return None
+
+
+def hyphenate_and_fix_conjunctions(source_tree, hyph):
+ texts = etree.XPath('/utwor/*[2]//text()')(source_tree)