From f8228cc6712f9a71f877b0ea60719c256519f16e Mon Sep 17 00:00:00 2001 From: =?utf8?q?Marek=20St=C4=99pniowski?= Date: Mon, 15 Sep 2008 16:26:10 +0200 Subject: [PATCH] Improved some regexes. --- lib/librarian/bin/book2txt.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/lib/librarian/bin/book2txt.py b/lib/librarian/bin/book2txt.py index 86f6f1274..413ff674b 100755 --- a/lib/librarian/bin/book2txt.py +++ b/lib/librarian/bin/book2txt.py @@ -11,10 +11,10 @@ REGEXES = [ (r']*>(.|\n)*?', ''), ('<(begin|end)\\sid=[\'|"][b|e]\\d+[\'|"]\\s/>', ''), (r'(()|())', ''), - (r'[^<]*', ''), - (r'(.|\n)*?

', ''), + (r'(.|\n)*?', ''), + (r'(.|\n)*?', ''), (r'<[^>]+>', ''), - (r'/$', ''), + (r'/\n', ''), (r'---', u'—'), (r'--', u'-'), (r',,', u'„'), -- 2.20.1