2 # -*- coding: utf-8 -*-
4 # This file is part of Librarian, licensed under GNU Affero GPLv3 or later.
5 # Copyright © Fundacja Nowoczesna Polska. See NOTICE for more information.
9 from copy import deepcopy
10 from lxml import etree
12 from librarian import epub, DirDocProvider, ParseError, cover
13 from librarian.dcparser import BookInfo
16 def utf_trunc(text, limit):
17 """ truncates text to at most `limit' bytes in utf-8 """
21 if len(text.encode('utf-8')) > limit:
23 while len(text.encode('utf-8')) > newlimit:
24 text = text[:(newlimit - len(text.encode('utf-8'))) / 4]
29 def virtualo(filenames, output_dir, verbose):
30 xml = etree.fromstring("""<?xml version="1.0" encoding="utf-8"?>
31 <products xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"></products>""")
32 product = etree.fromstring("""<product>
33 <publisherProductId></publisherProductId>
36 <description></description>
40 <lastName>Kowalski</lastName>
44 <language>PL</language>
48 for main_input in input_filenames:
51 path, fname = os.path.realpath(main_input).rsplit('/', 1)
52 provider = DirDocProvider(path)
53 slug, ext = os.path.splitext(fname)
55 outfile_dir = os.path.join(output_dir, slug)
56 os.makedirs(os.path.join(output_dir, slug))
58 info = BookInfo.from_file(main_input)
60 product_elem = deepcopy(product)
61 product_elem[0].text = utf_trunc(slug, 100)
62 product_elem[1].text = utf_trunc(info.title, 255)
63 product_elem[2].text = utf_trunc(info.description, 255)
64 product_elem[3].text = utf_trunc(info.source_name, 3000)
65 product_elem[4][0][0].text = utf_trunc(u' '.join(info.author.first_names), 100)
66 product_elem[4][0][1].text = utf_trunc(info.author.last_name, 100)
67 xml.append(product_elem)
70 u' '.join(info.author.first_names + (info.author.last_name,)),
72 ).save(os.path.join(outfile_dir, slug+'.jpg'))
73 outfile = os.path.join(outfile_dir, '1.epub')
74 outfile_sample = os.path.join(outfile_dir, '1.sample.epub')
75 epub.transform(provider, file_path=main_input, output_file=outfile)
76 epub.transform(provider, file_path=main_input, output_file=outfile_sample, sample=25)
78 print '%(file)s:%(name)s:%(message)s' % {
80 'name': e.__class__.__name__,
84 xml_file = open(os.path.join(output_dir, 'import_products.xml'), 'w')
85 xml_file.write(etree.tostring(xml, pretty_print=True, encoding=unicode).encode('utf-8'))
89 def prestigio(filenames, output_dir, verbose):
91 for main_input in input_filenames:
94 path, fname = os.path.realpath(main_input).rsplit('/', 1)
95 provider = DirDocProvider(path)
96 slug, ext = os.path.splitext(fname)
100 os.makedirs(output_dir)
103 outfile = os.path.join(output_dir, slug + '.epub')
104 epub.transform(provider, file_path=main_input, output_file=outfile,
105 cover_fn=cover.prestigio_cover, flags=('less-advertising',))
106 except ParseError, e:
107 print '%(file)s:%(name)s:%(message)s' % {
109 'name': e.__class__.__name__,
115 if __name__ == '__main__':
116 # Parse commandline arguments
117 usage = """Usage: %prog [options] SOURCE [SOURCE...]
118 Prepare SOURCE files for a partner."""
120 parser = optparse.OptionParser(usage=usage)
122 parser.add_option('-v', '--verbose', action='store_true', dest='verbose', default=False,
123 help='print status messages to stdout')
124 parser.add_option('-O', '--output-dir', dest='output_dir', metavar='DIR', default='',
125 help='specifies the directory for output')
126 parser.add_option('--virtualo', action='store_true', dest='virtualo', default=False,
127 help='prepare files for Virtualo API')
128 parser.add_option('--prestigio', action='store_true', dest='prestigio', default=False,
129 help='prepare files for prestigio')
131 options, input_filenames = parser.parse_args()
133 if len(input_filenames) < 1:
138 virtualo(input_filenames, options.output_dir, options.verbose)
139 if options.prestigio:
140 prestigio(input_filenames, options.output_dir, options.verbose)