1 from datetime import date
6 from django.conf import settings
7 from django.utils.html import escape, format_html
8 from django.utils.safestring import mark_safe
9 from librarian.builders.html import SnippetHtmlBuilder
10 from librarian.functions import lang_code_3to2
11 from catalogue.models import Audience, Author, Thema
13 from .base import BasePublisher
14 from .woblink_constants import WOBLINK_CATEGORIES
17 class WoblinkError(ValueError):
20 class NoPrice(WoblinkError):
23 'Brak <a href="/admin/depot/site/{site}">określonej ceny</a>.',
27 class NoIsbn(WoblinkError):
31 class AuthorLiteralForeign(WoblinkError):
34 'Nie obsługiwane: autor „{author}” w języku {lang}.',
35 author=str(self.args[0]),
36 lang=self.args[0].lang,
39 class AuthorNotInCatalogue(WoblinkError):
42 'Brak autora „{author}” w katalogu.',
43 author=str(self.args[0])
46 class AuthorNoWoblink(WoblinkError):
49 'Autor <a href="/admin/catalogue/author/{author_id}/">{author}</a> bez identyfikatora Woblink.',
50 author_id=self.args[0].id,
51 author=self.args[0].name
54 class NoThema(WoblinkError):
56 return format_html('Brak Thema.')
58 class UnknownThema(WoblinkError):
61 'Nieznana Thema {code}.',
66 class ThemaUnknownWoblink(WoblinkError):
69 'Thema <a href="/admin/catalogue/thema/{id}/">{code}</a> przypisana do nieznanej kategorii Woblink.',
71 code=self.args[0].code,
74 class NoWoblinkCategory(WoblinkError):
76 return 'Brak kategorii Woblink.'
78 class WoblinkWarning(Warning):
81 class NoMainThemaWarning(WoblinkWarning):
84 'Brak głównej kategorii Thema.'
87 class ThemaNoWoblink(WoblinkWarning):
90 'Thema <a href="/admin/catalogue/thema/{id}/">{code}</a> nie przypisana do kategorii Woblink.',
92 code=self.args[0].code,
95 class AuthorLiteralForeignWarning(WoblinkWarning):
98 'Nie obsługiwane: autor „{author}” w języku {lang}.',
99 author=str(self.args[0]),
100 lang=self.args[0].lang,
103 class AuthorNotInCatalogueWarning(WoblinkWarning):
106 'Brak autora „{author}” w katalogu.',
107 author=str(self.args[0])
110 class AuthorNoWoblinkWarning(WoblinkWarning):
113 'Autor <a href="/admin/catalogue/author/{author_id}/">{author}</a> bez identyfikatora Woblink.',
114 author_id=self.args[0].id,
115 author=self.args[0].name
121 class Woblink(BasePublisher):
122 BASE_URL = 'https://publisher.woblink.com/'
123 ADD_URL = BASE_URL + 'catalog/add'
124 STEP1_URL = BASE_URL + 'catalog/edit/%s'
125 STEP2_URL = BASE_URL + 'catalog/edit/%s/2'
126 STEP3_URL = BASE_URL + 'catalog/edit/%s/3'
127 STEP4_URL = BASE_URL + 'catalog/edit/%s/4'
128 STEP5_URL = BASE_URL + 'catalog/edit/%s/5'
129 UPLOAD_URL = BASE_URL + 'file/upload-%s'
130 JOB_STATUS_URL = BASE_URL + 'task/status'
131 GENERATE_DEMO_URL = BASE_URL + 'task/run/generate-%s-demo/%s/%d'
132 CHECK_DEMO_URL = BASE_URL + 'task/run/check-%s-demo/%s'
134 SEARCH_CATALOGUE_URL = BASE_URL + '{category}/autocomplete/{term}'
140 response = self.session.get('https://publisher.woblink.com/login')
142 r'name="_csrf_token" value="([^"]+)"',
146 '_csrf_token': token,
147 '_username': self.username,
148 '_password': self.password,
150 response = self.session.post(
151 'https://publisher.woblink.com/login_check',
155 def search_catalogue(self, category, term):
156 return self.session.get(
157 self.SEARCH_CATALOGUE_URL.format(category=category, term=term)
160 def search_author_catalogue(self, term):
164 'text': item['autFullname']
166 for item in self.search_catalogue('author', term)
168 def search_series_catalogue(self, term):
174 for item in self.search_catalogue('series', term)
def get_isbn(self, meta, errors=None):
    """Return the EPUB ISBN stored on *meta*.

    When ``meta.isbn_epub`` is falsy and an ``errors`` list was supplied,
    a ``NoIsbn`` instance is appended to that list. Nothing is raised
    here; the (possibly empty) value is returned either way.
    """
    isbn = meta.isbn_epub
    # Problems are only collected when the caller asked for them.
    if errors is not None and not isbn:
        errors.append(NoIsbn())
    return isbn
183 def get_authors_data(self, meta, errors=None):
185 for role, items, obligatory in [
186 (self.ROLE_AUTHOR, meta.authors, True),
187 (self.ROLE_TRANSLATOR, meta.translators, False)
189 for person_literal in items:
190 if person_literal.lang != 'pl':
191 if errors is not None:
193 errors.append(AuthorLiteralForeign(person_literal))
195 errors.append(AuthorLiteralForeignWarning(person_literal))
197 aobj = Author.get_by_literal(str(person_literal))
199 if errors is not None:
201 errors.append(AuthorNotInCatalogue(person_literal))
203 errors.append(AuthorNotInCatalogueWarning(person_literal))
206 if errors is not None:
208 errors.append(AuthorNoWoblink(aobj))
210 errors.append(AuthorNoWoblinkWarning(aobj))
212 authors.append((role, aobj.woblink))
215 def get_genres(self, meta, errors=None):
218 thema_codes.append(meta.thema_main)
220 if errors is not None:
221 errors.append(NoMainThemaWarning())
222 thema_codes.extend(meta.thema)
225 Audience.objects.filter(code__in=meta.audiences).exclude(
226 thema='').values_list('thema', flat=True)
230 if errors is not None:
231 errors.append(NoThema())
233 for code in thema_codes:
235 thema = Thema.objects.get(code=code)
236 except Thema.DoesNotExist:
237 if errors is not None:
238 errors.append(UnknownThema(code))
240 if thema.woblink_category is None:
241 if errors is not None:
242 errors.append(ThemaNoWoblink(thema))
243 elif thema.woblink_category not in WOBLINK_CATEGORIES:
244 if errors is not None:
245 errors.append(ThemaUnknownWoblink(thema))
246 elif thema.woblink_category not in category_ids:
247 category_ids.append(thema.woblink_category)
249 if errors is not None:
250 errors.append(NoWoblinkCategory())
def get_series(self, meta, errors=None):
    """Return the ``woblink`` values of audiences listed in *meta*.

    Looks up ``Audience`` rows whose ``code`` is in ``meta.audiences``,
    drops rows whose ``woblink`` is ``None``, and returns the remaining
    ``woblink`` values as a list. ``errors`` is accepted for signature
    parity with the other ``get_*`` methods but is not used here.
    """
    matching = Audience.objects.filter(code__in=meta.audiences)
    mapped = matching.exclude(woblink=None)
    woblink_values = mapped.values_list('woblink', flat=True)
    return list(woblink_values)
257 def get_abstract(self, wldoc, errors=None, description_add=None):
258 description = self.get_description(wldoc, description_add)
259 parts = description.split('\n', 1)
260 if len(parts) == 1 or len(parts[0]) > 240:
261 # No newline found here.
262 # Try to find last sentence end..
263 parts = re.split(r' \.', description[240::-1], 1)
265 p1 = parts[1][::-1] + '.'
266 p2 = description[len(p1) + 1:]
268 # No sentence end found.
270 p1 = description[:240].rsplit(' ', 1)[0]
271 p2 = description[len(p1) + 1:]
276 m = re.search(r'<[^>]+$', parts[0])
278 parts[0] = parts[0][:-len(m.group(0))]
279 parts[1] = m.group(0) + parts[1]
282 for tag in re.findall(r'<[^>]*[^/>]>', parts[0]):
287 for tag in reversed(opened):
288 parts[0] += '</' + tag[1:-1].split()[0] + '>'
289 parts[1] = tag + parts[1]
def get_lang2code(self, meta, errors=None):
    """Return ``lang_code_3to2`` applied to ``meta.language``.

    ``errors`` is accepted for signature parity with the other ``get_*``
    methods but is not used here.
    """
    language = meta.language
    return lang_code_3to2(language)
298 def get_price(self, site, wldoc, errors=None):
300 stats = wldoc.get_statistics()['total']
303 errors.append(NoPrice(site))
305 words = stats['words_with_fn']
306 pages = stats['chars_with_fn'] / 1800
307 price = site.get_price(words, pages)
310 errors.append(NoPrice(site))
315 def can_publish(self, site, book):
322 wldoc = book.wldocument(librarian2=True)
324 d['errors'].append('Nieprawidłowy dokument.')
327 book_data = self.get_book_data(site, wldoc, errors)
329 if not isinstance(error, Warning):
330 errlist = d['errors']
332 errlist = d['warnings']
333 errlist.append(error.as_html())
335 if book_data.get('isbn'):
336 d['info'].append(format_html(
338 isbn=book_data['isbn'],
341 if book_data.get('genres'):
342 d['info'].append(format_html(
343 'W kategoriach: {cat} ({price} zł)',
344 cat=', '.join(self.describe_category(g) for g in book_data['genres']),
345 price=book_data['price'],
347 d['info'].append(mark_safe(
348 '<strong>' + book_data['abstract']['header'] +
349 '</strong><br/>' + book_data['abstract']['rest']
354 def describe_category(self, category):
357 c = WOBLINK_CATEGORIES[category]
359 category = c.get('parent')
360 return ' / '.join(reversed(t))
362 def create_book(self, isbn):
363 isbn = ''.join(c for c in isbn if c.isdigit())
364 assert len(isbn) == 13
365 response = self.session.post(
368 'AddPublication[pubType]': 'ebook',
369 'AddPublication[pubHasIsbn]': '1',
370 'AddPublication[pubIsbn]': isbn,
374 m = re.search(r'/(\d+)$', response.url)
378 def send_book(self, site_book_publish, changes=None):
379 site_book = site_book_publish.site_book
380 book = site_book.book
381 site = site_book.site
382 wldoc = book.wldocument(librarian2=True, changes=changes, publishable=False) # TODO pub
385 book_data = self.get_book_data(site, wldoc)
387 if not site_book.external_id:
388 woblink_id = self.create_book(book_data['isbn'])
390 site_book.external_id = woblink_id
391 site_book.save(update_fields=['external_id'])
392 woblink_id = site_book.external_id
394 self.edit_step1(woblink_id, book_data)
395 self.edit_step2(woblink_id, book_data)
396 self.edit_step3(woblink_id, book_data)
397 cover_id = self.send_cover(woblink_id, wldoc)
399 texts = site.get_texts()
400 epub_id, epub_demo = self.send_epub(
401 woblink_id, wldoc, book.gallery_path(),
404 mobi_id, mobi_demo = self.send_mobi(
405 woblink_id, wldoc, book.gallery_path(),
409 woblink_id, book_data,
410 cover_id, epub_id, epub_demo, mobi_id, mobi_demo,
412 self.edit_step5(woblink_id, book_data)
414 def get_book_data(self, site, wldoc, errors=None):
416 "title": wldoc.meta.title,
417 "isbn": self.get_isbn(wldoc.meta, errors=errors),
418 "authors": self.get_authors_data(wldoc.meta, errors=errors),
419 "abstract": self.get_abstract(
420 wldoc, errors=errors, description_add=site.description_add
422 "lang2code": self.get_lang2code(wldoc.meta, errors=errors),
423 "genres": self.get_genres(wldoc.meta, errors=errors),
424 "price": self.get_price(site, wldoc, errors=errors),
425 "series": self.get_series(wldoc.meta, errors=errors),
428 def with_form_name(self, data, name):
431 for (k, v) in data.items()
434 def edit_step1(self, woblink_id, book_data):
439 "AhpPubId": woblink_id,
440 "AhpAutId": author_id,
441 "AhpType": author_type,
443 for (author_type, author_id) in data['authors']
448 'PublicationId': woblink_id,
449 'SeriesId': series_id,
451 for series_id in data['series']
455 'pubTitle': book_data['title'],
456 'npwAuthorHasPublications': json.dumps(authors_data),
457 'pubShortNote': data['abstract']['header'],
458 'pubNote': data['abstract']['rest'],
459 'pubCulture': data['lang2code'],
460 'npwPublicationHasAwards': '[]',
461 'npwPublicationHasSeriess': json.dumps(series_data),
463 d = self.with_form_name(d, 'EditPublicationStep1')
464 d['roles'] = [author_type for (author_type, author_id) in data['authors']]
465 r = self.session.post(self.STEP1_URL % woblink_id, data=d)
469 def edit_step2(self, woblink_id, book_data):
472 for i, g in enumerate(book_data['genres']):
473 gdata = WOBLINK_CATEGORIES[g]
475 legacy = gdata.get('legacy')
476 if p := gdata.get('parent'):
477 gd.setdefault(p, {'isMain': False})
478 gd[p].setdefault('children', [])
479 gd[p]['children'].append(str(g))
480 gd[p].setdefault('mainChild', str(g))
482 legacy = WOBLINK_CATEGORIES[p].get('legacy')
485 gd[g]['isMain'] = True
492 for k, v in gd.items()
496 'npwPublicationHasNewGenres': json.dumps(gd),
497 'genre': legacy or '',
499 data = self.with_form_name(data, 'AddPublicationStep2')
500 return self.session.post(self.STEP2_URL % woblink_id, data=data)
502 def edit_step3(self, woblink_id, book_data):
504 'pubBasePrice': book_data['price'],
505 'pubPremiereDate': date.today().isoformat(),
506 'pubIsLicenseIndefinite': '1',
507 'pubFileFormat': 'epub+mobi',
509 'pubPublisherIndex': '',
510 'save_and_continue': '',
512 d = self.with_form_name(d, 'EditPublicationStep3')
513 return self.session.post(self.STEP3_URL % woblink_id, data=d)
515 def edit_step4(self, woblink_id, book_data, cover_id, epub_id, epub_demo, mobi_id, mobi_demo):
517 'pubCoverResId': cover_id,
518 'pubEpubResId': epub_id,
519 'pubEpubDemoResId': epub_demo,
520 'pubMobiResId': mobi_id,
521 'pubMobiDemoResId': mobi_demo,
522 'pubFileFormat': 'epub+mobi',
524 'save_and_continue': '',
526 d = self.with_form_name(d, 'EditPublicationStep4')
527 return self.session.post(self.STEP4_URL % woblink_id, data=d)
529 def edit_step5(self, woblink_id, book_data):
531 d = self.with_form_name(d, 'EditPublicationStep5')
532 return self.session.post(self.STEP5_URL % woblink_id, data=d)
534 def wait_for_job(self, job_id):
536 response = self.session.post(
538 data={'ids[]': job_id}
540 data = response.json()[job_id]
542 assert data['successful']
543 return data.get('returnValue')
546 def upload_file(self, woblink_id, filename, content, field_name, mime_type):
547 form_name = f'Upload{field_name}'
548 id_field = f'pub{field_name}ResId'
549 field_name = field_name.lower()
555 field_name: (filename, content, mime_type)
558 response = self.session.post(
559 self.UPLOAD_URL % field_name,
560 data=self.with_form_name(data, form_name),
561 files=self.with_form_name(files, form_name),
563 resp_data = response.json()
564 assert resp_data['success'] is True
565 file_id = resp_data[id_field]
566 if 'jobId' in resp_data:
567 self.wait_for_job(resp_data['jobId'])
570 def generate_demo(self, woblink_id, file_format, check=True):
573 job_id = self.session.get(
574 self.GENERATE_DEMO_URL % (file_format, woblink_id, percent),
577 file_id = self.wait_for_job(job_id)
581 self.CHECK_DEMO_URL % (file_format, woblink_id)
584 except AssertionError:
594 def send_epub(self, woblink_id, doc, gallery_path, fundraising=None):
595 from librarian.builders import EpubBuilder
596 content = EpubBuilder(
597 base_url='file://' + gallery_path + '/',
598 fundraising=fundraising or [],
599 ).build(doc).get_file()
600 file_id = self.upload_file(
602 doc.meta.url.slug + '.epub',
605 'application/epub+zip'
607 demo_id = self.generate_demo(woblink_id, 'epub')
608 return file_id, demo_id
610 def send_mobi(self, woblink_id, doc, gallery_path, fundraising=None):
611 from librarian.builders import MobiBuilder
612 content = MobiBuilder(
613 base_url='file://' + gallery_path + '/',
614 fundraising=fundraising or [],
615 ).build(doc).get_file()
616 file_id = self.upload_file(
618 doc.meta.url.slug + '.mobi',
621 'application/x-mobipocket-ebook'
623 demo_id = self.generate_demo(woblink_id, 'mobi', check=False)
624 return file_id, demo_id
626 def send_cover(self, woblink_id, doc):
627 from librarian.cover import make_cover
630 cover = make_cover(doc.meta, cover_class='m-label', width=1748, height=2480)
631 content = io.BytesIO()
632 cover.final_image().save(content, cover.format)
634 file_id = self.upload_file(
636 doc.meta.url.slug + '.jpeg',