X-Git-Url: https://git.mdrn.pl/wolnelektury.git/blobdiff_plain/239d66922f4b83ee5baaa284a9c33a32bfcb99a4..648dff98814d2ddeda2f06a8c0e2fb01547fac2a:/bin/book2html.py diff --git a/bin/book2html.py b/bin/book2html.py deleted file mode 100755 index 5bd2bb527..000000000 --- a/bin/book2html.py +++ /dev/null @@ -1,55 +0,0 @@ -#!/usr/bin/env python -# -*- coding: utf-8 -*- -import cStringIO -import re -import optparse -import os -import sys - -from lxml import etree - - -# Parse args -usage = """Usage: %prog [options] SOURCE [SOURCE...] -Convert SOURCE files to HTML format.""" - -parser = optparse.OptionParser(usage=usage) - -parser.add_option('-v', '--verbose', action='store_true', dest='verbose', default=False, - help='print status messages to stdout') - -options, input_filenames = parser.parse_args() - -if len(input_filenames) < 1: - parser.print_help() - exit(1) - -# Parse XSLT -style = etree.parse('book2html.xslt') - -# Do some real work -for input_filename in input_filenames: - if options.verbose: - print input_filename - - output_filename = os.path.splitext(input_filename)[0] + '.html' - - # Transform - doc_file = cStringIO.StringIO() - expr = re.compile(r'/\s', re.MULTILINE | re.UNICODE); - - f = open(input_filename, 'r') - for line in f: - line = line.decode('utf-8') - line = expr.sub(u'
\n', line).replace(u'---', u'—').replace(u',,', u'„') - doc_file.write(line.encode('utf-8')) - f.close() - - doc_file.seek(0); - - parser = etree.XMLParser(remove_blank_text=True) - doc = etree.parse(doc_file, parser) - - result = doc.xslt(style) - result.write(output_filename, xml_declaration=True, pretty_print=True, encoding='utf-8') -