fixes for edge cases
[librarian.git] / tests / test_text.py
index 70dfb60..c566a48 100644 (file)
@@ -3,32 +3,62 @@
 # This file is part of Librarian, licensed under GNU Affero GPLv3 or later.
 # Copyright © Fundacja Nowoczesna Polska. See NOTICE for more information.
 #
+from __future__ import unicode_literals
+
+import unittest
 from librarian import NoDublinCore
-from librarian.parser import WLDocument
+from librarian.builders import builders
+from librarian.parser import WLDocument as LegacyWLDocument
+from librarian.document import WLDocument
 from nose.tools import *
-from utils import get_fixture
+from .utils import get_fixture
+
+
+class TextTests(unittest.TestCase):
+    maxDiff = None
+
+    def test_transform_legacy(self):
+        expected_output_file_path = get_fixture('text', 'asnyk_miedzy_nami_expected.txt')
+
+        text = LegacyWLDocument.from_file(
+            get_fixture('text', 'miedzy-nami-nic-nie-bylo.xml')
+        ).as_text().get_bytes().decode('utf-8')
+
+        with open(expected_output_file_path, 'rb') as f:
+            self.assertEqual(text, f.read().decode('utf-8'))
+
+    def test_transform(self):
+        expected_output_file_path = get_fixture('text', 'asnyk_miedzy_nami_expected.txt')
+
+        text = WLDocument(
+            filename=get_fixture('text', 'miedzy-nami-nic-nie-bylo.xml')
+        ).build(builders['txt']).get_bytes().decode('utf-8')
 
+        with open(expected_output_file_path, 'rb') as f:
+            self.assertEqual(text, f.read().decode('utf-8'))
 
-def test_transform():
-    expected_output_file_path = get_fixture('text', 'asnyk_miedzy_nami_expected.txt')
+    
+    def test_transform_raw(self):
+        expected_output_file_path = get_fixture('text', 'asnyk_miedzy_nami_expected_raw.txt')
 
-    text = WLDocument.from_file(
+        text = LegacyWLDocument.from_file(
             get_fixture('text', 'miedzy-nami-nic-nie-bylo.xml')
-        ).as_text().get_string()
+        ).as_text(flags=['raw-text']).get_bytes().decode('utf-8')
 
-    assert_equal(text, file(expected_output_file_path).read())
+        with open(expected_output_file_path, 'rb') as f:
+            self.assertEqual(text, f.read().decode('utf-8'))
 
 
 @raises(NoDublinCore)
 def test_no_dublincore():
-    WLDocument.from_file(
+    LegacyWLDocument.from_file(
             get_fixture('text', 'asnyk_miedzy_nami_nodc.xml')
         ).as_text()
 
 
 def test_passing_parse_dublincore_to_transform():
     """Passing parse_dublincore=False to the constructor omits DublinCore parsing."""
-    WLDocument.from_file(
+    LegacyWLDocument.from_file(
             get_fixture('text', 'asnyk_miedzy_nami_nodc.xml'),
             parse_dublincore=False,
         ).as_text()