From: Radek Czajka <radoslaw.czajka@nowoczesnapolska.org.pl>
Date: Tue, 8 Mar 2011 12:07:08 +0000 (+0100)
Subject: encode unicode for lxml
X-Git-Tag: 1.7~203
X-Git-Url: https://git.mdrn.pl/librarian.git/commitdiff_plain/fec62da2886e29aa0a9233e13fd9cae0ca6076bf?hp=e868b7e6511dfbb89e5a9dd69bbb7ef13c42620a

Encode unicode data as UTF-8 before passing it to lxml's parser
---

diff --git a/librarian/parser.py b/librarian/parser.py
index 4cdaa79..afc4f1a 100644
--- a/librarian/parser.py
+++ b/librarian/parser.py
@@ -61,7 +61,7 @@ class WLDocument(object):
 
         try:
             parser = etree.XMLParser(remove_blank_text=False)
-            tree = etree.parse(StringIO(data), parser)
+            tree = etree.parse(StringIO(data.encode('utf-8')), parser)
 
             if swap_endlines:
                 cls.swap_endlines(tree)