X-Git-Url: https://git.mdrn.pl/librarian.git/blobdiff_plain/fefdce4e24f9e397df5538fe6e7f54b5ece4d841..e18331d927f54751163baf89bb2c93ae0c854a3b:/src/librarian/hyphenator.py?ds=sidebyside diff --git a/src/librarian/hyphenator.py b/src/librarian/hyphenator.py index aa5b4c3..c2fbb81 100644 --- a/src/librarian/hyphenator.py +++ b/src/librarian/hyphenator.py @@ -14,8 +14,6 @@ info@wilbertberendsen.nl License: LGPL. """ -from __future__ import print_function, unicode_literals - import sys import re @@ -81,13 +79,13 @@ class Hyph_dict(object): """ def __init__(self, filename): self.patterns = {} - f = open(filename) + f = open(filename, 'rb') charset = f.readline().strip() - if charset.startswith('charset '): + if charset.startswith(b'charset '): charset = charset[8:].strip() for pat in f: - pat = pat.decode(charset).strip() + pat = pat.decode(charset.decode('latin1')).strip() if not pat or pat[0] == '%': continue # replace ^^hh with the real character pat = parse_hex(hexrepl, pat) @@ -211,7 +209,7 @@ class Hyphenator(object): the string 'let-ter-gre-pen'. The hyphen string to use can be given as the second parameter, that defaults to '-'. """ - if isinstance(word, str): + if isinstance(word, bytes): word = word.decode('latin1') l = list(word) for p in reversed(self.positions(word)):