X-Git-Url: https://git.mdrn.pl/librarian.git/blobdiff_plain/102460ac788a7307391852115d8f142e6e5c3cdd..bc701e0442638cef5857b5776e30bf7362bbd580:/src/librarian/pdf.py diff --git a/src/librarian/pdf.py b/src/librarian/pdf.py index e5cf5bd..647b18f 100644 --- a/src/librarian/pdf.py +++ b/src/librarian/pdf.py @@ -196,7 +196,7 @@ def add_fundraising(doc, fundraising): naglowek.addprevious(spot) spots.append(spot) spot = etree.Element('f_spot') - doc.getroot()[-1][-1].append(spot) + doc.getroot()[-1].append(spot) spots.append(spot) e = len(spots) nfunds = len(fundraising) @@ -463,6 +463,8 @@ def load_including_children(wldoc=None, provider=None, uri=None): text = re.sub(r"([\u0400-\u04ff]+)", r"\1", text) # Geometric shapes. text = re.sub(r"([\u25a0-\u25ff]+)", r"\1", text) + # Hebrew + text = re.sub(r"([\u0590-\u05ff]+)", r"\1", text) document = WLDocument.from_bytes(text.encode('utf-8'), parse_dublincore=True, provider=provider)