-from librarian import epub, pdf, DirDocProvider, ParseError, cover
-from librarian.dcparser import BookInfo
-
-
def utf_trunc(text, limit):
    """Truncate `text` so that its UTF-8 encoding takes at most `limit` bytes.

    text  -- the string to shorten; None is passed through unchanged
    limit -- maximum allowed size of the result, in UTF-8 bytes

    Text that already fits is returned unchanged.  Otherwise whole
    characters are dropped from the end and '...' is appended, the ellipsis
    counting towards the limit.  When `limit` is too small to hold the
    ellipsis (below 3 bytes), the text is cut without it; a limit of zero
    or less yields an empty string.
    """
    if text is None:
        return text
    if len(text.encode('utf-8')) <= limit:
        return text

    suffix = '...'
    budget = limit - len(suffix)
    if budget < 0:
        # No room for the ellipsis.  Without this guard the loop below
        # could never terminate, as even an empty string exceeds a
        # negative budget.
        suffix = ''
        budget = max(limit, 0)

    size = len(text.encode('utf-8'))
    while size > budget:
        # A character takes at most 4 bytes in UTF-8, so at least
        # ceil(excess / 4) characters have to go.  Floor division of the
        # negative difference gives exactly that count as a negative slice
        # bound, so the loop never removes more than necessary.
        text = text[:(budget - size) // 4]
        size = len(text.encode('utf-8'))
    return text + suffix
-
-
def virtualo(filenames, output_dir, verbose):
    """Package books for Virtualo: covers, EPUBs and a product list.

    For every input file a directory named after the file's slug (its name
    without extension) is created under `output_dir`.  It receives a cover
    image (`<slug>.jpg`), an EPUB (`1.epub`) and a second EPUB generated
    with `sample=25` (`1.sample.epub`).  Finally `import_products.xml`,
    holding one <product> element per processed book, is written to
    `output_dir`.

    filenames  -- iterable of paths to the source documents
    output_dir -- directory receiving the per-book directories and the XML
    verbose    -- when true, print each input path before processing it

    A ParseError stops processing of the remaining files; it is reported on
    stdout and the products gathered so far are still written.
    os.makedirs raises OSError if a book's directory already exists.
    """
    xml = etree.fromstring("""<?xml version="1.0" encoding="utf-8"?>
    <products xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"></products>""")
    # Template copied for each book.  The author names below are only
    # placeholders and are overwritten for every product.
    product = etree.fromstring("""<product>
            <publisherProductId></publisherProductId>
            <title></title>
            <info></info>
            <description></description>
            <authors>
                <author>
                    <names>Jan</names>
                    <lastName>Kowalski</lastName>
                </author>
            </authors>
            <price>0.0</price>
            <language>PL</language>
        </product>""")

    try:
        for main_input in filenames:
            if verbose:
                print(main_input)
            # os.path.split also copes with a file located directly in the
            # filesystem root and with non-'/' path separators.
            path, fname = os.path.split(os.path.realpath(main_input))
            provider = DirDocProvider(path)
            slug = os.path.splitext(fname)[0]

            outfile_dir = os.path.join(output_dir, slug)
            os.makedirs(outfile_dir)

            info = BookInfo.from_file(main_input)

            # Fill in a private copy of the template; elements are looked
            # up by tag rather than by position.
            product_elem = deepcopy(product)
            product_elem.find('publisherProductId').text = utf_trunc(slug, 100)
            product_elem.find('title').text = utf_trunc(info.title, 255)
            # NOTE(review): <info> takes the book description and
            # <description> takes the source name, exactly as before --
            # confirm this mapping against the Virtualo import format.
            product_elem.find('info').text = utf_trunc(info.description, 255)
            product_elem.find('description').text = utf_trunc(info.source_name, 3000)
            author_elem = product_elem.find('authors/author')
            author_elem.find('names').text = utf_trunc(
                u' '.join(info.author.first_names), 100)
            author_elem.find('lastName').text = utf_trunc(info.author.last_name, 100)
            xml.append(product_elem)

            cover.VirtualoCover(
                u' '.join(info.author.first_names + (info.author.last_name,)),
                info.title
            ).save(os.path.join(outfile_dir, slug + '.jpg'))
            outfile = os.path.join(outfile_dir, '1.epub')
            outfile_sample = os.path.join(outfile_dir, '1.sample.epub')
            epub.transform(provider, file_path=main_input, output_file=outfile)
            epub.transform(provider, file_path=main_input, output_file=outfile_sample, sample=25)
    except ParseError as e:
        print('%(file)s:%(name)s:%(message)s' % {
            'file': main_input,
            'name': e.__class__.__name__,
            'message': e.message
        })

    # The context manager closes the file even if serialisation fails.
    with open(os.path.join(output_dir, 'import_products.xml'), 'w') as xml_file:
        xml_file.write(etree.tostring(xml, pretty_print=True, encoding=unicode).encode('utf-8'))
-
-
def prestigio(filenames, output_dir, verbose):
    """Build an EPUB with the Prestigio cover for every input file.

    Each book is written to `<output_dir>/<slug>.epub`, where the slug is
    the input file's name without its extension.

    filenames  -- iterable of paths to the source documents
    output_dir -- target directory; created on demand unless it is ''
    verbose    -- when true, print each input path before processing it

    A ParseError stops processing of the remaining files and is reported on
    stdout instead of being propagated.
    """
    try:
        for main_input in filenames:
            if verbose:
                print(main_input)
            path, fname = os.path.split(os.path.realpath(main_input))
            provider = DirDocProvider(path)
            slug = os.path.splitext(fname)[0]

            if output_dir != '':
                try:
                    os.makedirs(output_dir)
                except OSError:
                    # Best effort: usually the directory already exists.
                    # Any other failure presumably surfaces when the
                    # output file is written below.
                    pass
            outfile = os.path.join(output_dir, slug + '.epub')
            epub.transform(provider, file_path=main_input, output_file=outfile,
                           cover=cover.PrestigioCover, flags=('less-advertising',))
    except ParseError as e:
        print('%(file)s:%(name)s:%(message)s' % {
            'file': main_input,
            'name': e.__class__.__name__,
            'message': e.message
        })
-
-
def prestigio_pdf(filenames, output_dir, verbose):
    """Build a PDF with the Prestigio cover for every input file.

    Each book is written to `<output_dir>/<slug>.pdf`, where the slug is
    the input file's name without its extension.

    filenames  -- iterable of paths to the source documents
    output_dir -- target directory; created on demand unless it is ''
    verbose    -- when true, print each input path before processing it;
                  the flag is also forwarded to pdf.transform

    A ParseError stops processing of the remaining files and is reported on
    stdout instead of being propagated.
    """
    try:
        for main_input in filenames:
            if verbose:
                print(main_input)
            path, fname = os.path.split(os.path.realpath(main_input))
            provider = DirDocProvider(path)
            slug = os.path.splitext(fname)[0]

            if output_dir != '':
                try:
                    os.makedirs(output_dir)
                except OSError:
                    # Best effort: usually the directory already exists.
                    # Any other failure presumably surfaces when the
                    # output file is written below.
                    pass
            outfile = os.path.join(output_dir, slug + '.pdf')
            pdf.transform(provider, file_path=main_input, output_file=outfile,
                          cover=cover.PrestigioCover, verbose=verbose,
                          flags=('less-advertising',))
    except ParseError as e:
        print('%(file)s:%(name)s:%(message)s' % {
            'file': main_input,
            'name': e.__class__.__name__,
            'message': e.message
        })
-
-
-def bookoteka(filenames, output_dir, verbose):