X-Git-Url: https://git.mdrn.pl/audio.git/blobdiff_plain/c7d2e4daae13c7c1100ec0d42ace0e8c34b5ae24..d34100c7ed69f83e552ec589fd0c353129165452:/src/archive/models.py diff --git a/src/archive/models.py b/src/archive/models.py index 4a1d763..869641c 100644 --- a/src/archive/models.py +++ b/src/archive/models.py @@ -1,19 +1,35 @@ +import io +import json import os.path from django.db import models from time import sleep -from django.utils.encoding import force_bytes -from django.utils.translation import ugettext_lazy as _ +from django.utils.functional import cached_property +from django.utils.timezone import now +from django.utils.translation import gettext_lazy as _ +from django_pglocks import advisory_lock +import requests from archive.constants import status -from archive.settings import FILES_SAVE_PATH, ADVERT, LICENSE, ORGANIZATION, PROJECT +from archive.settings import FILES_SAVE_PATH, ADVERT, ORGANIZATION, PROJECT from archive.utils import OverwriteStorage, sha1_file +class License(models.Model): + uri = models.CharField(max_length=255, unique=True) + name = models.CharField(max_length=255) + + def __str__(self): + return self.name + + class Project(models.Model): """ an audiobook project, needed for specyfing sponsors """ name = models.CharField(max_length=128, unique=True, db_index=True, verbose_name="Nazwa") sponsors = models.TextField(blank=True, null=True, verbose_name="Sponsorzy") + description = models.TextField(blank=True, verbose_name="Opis") + youtube = models.ForeignKey('youtube.YouTube', models.PROTECT) + icon = models.FileField(upload_to='archive/project', blank=True, null=True) class Meta: verbose_name = _("project") @@ -23,6 +39,14 @@ class Project(models.Model): def __str__(self): return self.name + def get_description(self): + if self.description: + return self.description + return "Audiobook nagrany w ramach projektu %s%s." % ( + self.name, + " finansowanego przez %s" % self.sponsors if self.sponsors else "", + ) + def source_upload_to(intance, filename): return os.path.join(FILES_SAVE_PATH, filename) # FIXME: what about really long file names? @@ -32,20 +56,29 @@ class Audiobook(models.Model): source_file = models.FileField(upload_to=source_upload_to, max_length=255, verbose_name=_('source file'), editable=False) source_sha1 = models.CharField(max_length=40, editable=False) + duration = models.FloatField(null=True, editable=False) title = models.CharField(max_length=255, verbose_name=_('title')) part_name = models.CharField(max_length=255, verbose_name=_('part name'), help_text=_('eg. chapter in a novel'), default='', blank=True) - index = models.IntegerField(verbose_name=_('index'), default=0) - parts_count = models.IntegerField(verbose_name=_('parts count'), default=1) + index = models.IntegerField(verbose_name=_('index'), default=0, help_text=_('Ordering of parts of a book.')) + youtube_volume = models.CharField( + _("Volume name for YouTube"), + max_length=100, + blank=True, + help_text=_( + "If set, audiobooks with the save value will be published as single YouTube video." + ), + ) artist = models.CharField(max_length=255, verbose_name=_('artist')) conductor = models.CharField(max_length=255, verbose_name=_('conductor')) encoded_by = models.CharField(max_length=255, verbose_name=_('encoded by')) date = models.CharField(max_length=255, verbose_name=_('date')) - project = models.ForeignKey(Project, verbose_name=_('project')) - url = models.URLField(max_length=255, verbose_name=_('book url')) + project = models.ForeignKey(Project, models.PROTECT, verbose_name=_('project')) + slug = models.SlugField(max_length=120, blank=True, help_text=_('WL catalogue slug of the book.')) translator = models.CharField(max_length=255, null=True, blank=True, verbose_name=_('translator')) modified = models.DateTimeField(null=True, editable=False) + license = models.ForeignKey(License, models.PROTECT, null=True, blank=True, verbose_name=_('license')) # publishing process mp3_status = models.SmallIntegerField(null=True, editable=False, choices=status.choices) @@ -62,6 +95,14 @@ class Audiobook(models.Model): ogg_published_tags = models.TextField(null=True, editable=False) ogg_published = models.DateTimeField(null=True, editable=False) + youtube_status = models.SmallIntegerField(null=True, editable=False, choices=status.choices) + youtube_task = models.CharField(max_length=64, null=True, editable=False) + youtube_tags = models.TextField(null=True, editable=False) + youtube_published_tags = models.TextField(null=True, editable=False) + youtube_published = models.DateTimeField(null=True, editable=False) + youtube_id = models.CharField(max_length=255, blank=True, default='') + youtube_queued = models.DateTimeField(null=True, blank=True) + class Meta: verbose_name = _("audiobook") verbose_name_plural = _("audiobooks") @@ -70,6 +111,50 @@ class Audiobook(models.Model): def __str__(self): return self.title + @property + def url(self): + return f'https://wolnelektury.pl/katalog/lektura/{self.slug}/' + + @property + def parts_count(self): + return type(self).objects.filter(slug=self.slug).count() + + @property + def youtube_volume_count(self): + total = 0 + prev_volume = None + for a in type(self).objects.filter(slug=self.slug).order_by("index"): + if not a.youtube_volume or a.youtube_volume != prev_volume: + total += 1 + prev_volume = a.youtube_volume + return total + + @property + def youtube_volume_index(self): + index = 0 + prev_volume = None + for a in type(self).objects.filter(slug=self.slug, index__lte=self.index).order_by("index"): + if not a.youtube_volume or a.youtube_volume != prev_volume: + index += 1 + prev_volume = a.youtube_volume + return index + + @property + def is_youtube_publishable(self): + return ( + not self.youtube_volume + or not type(self) + .objects.filter(youtube_volume=self.youtube_volume, index__lt=self.index) + .exists() + ) + + def youtube_publish(self): + if not self.is_youtube_publishable: + return False + self.youtube_status = status.QUEUED + self.youtube_queued = now() + self.save(update_fields=['youtube_status', 'youtube_queued']) + def get_mp3_tags(self): return json.loads(self.mp3_tags) if self.mp3_tags else None def get_ogg_tags(self): return json.loads(self.ogg_tags) if self.ogg_tags else None def get_mp3_published_tags(self): return json.loads(self.mp3_published_tags) if self.mp3_published_tags else None @@ -81,41 +166,29 @@ class Audiobook(models.Model): return self.mp3_published and self.ogg_published def get_source_sha1(self): - source_sha1 = self.source_sha1 - if self.pk: - source_sha1 = type(self).objects.get(pk=self.pk).source_sha1 - while source_sha1 == 'wait': - sleep(10) - if not source_sha1: - self.source_sha1 = 'wait' - if self.pk: - type(self).objects.filter(pk=self.pk).update(source_sha1='wait') - try: - f = open(force_bytes(self.source_file.path)) - source_sha1 = sha1_file(f) - self.source_sha1 = source_sha1 - if self.pk: - type(self).objects.filter(pk=self.pk).update(source_sha1=source_sha1) - except: - self.source_sha1 = '' - if self.pk: - type(self).objects.filter(pk=self.pk).update(source_sha1='') - return None - return source_sha1 - + assert self.pk or self.source_sha1 + if not self.source_sha1: + with advisory_lock(f'get_source_sha1_{self.pk}'): + with open(self.source_file.path, 'rb') as f: + self.source_sha1 = sha1_file(f) + self.save(update_fields=['source_sha1']) + return self.source_sha1 def new_publish_tags(self): title = self.title if self.translator: title += ' (tłum. %s)' % self.translator - copyright = "%s %s. Licensed to the public under %s verify at %s" % ( - self.date, ORGANIZATION, LICENSE, self.url) + copyright = "%s %s." % ( + self.date, ORGANIZATION) + if self.license: + copyright += " Licensed to the public under %s verify at %s" % ( + self.license.uri, self.url) - comment = "Audiobook nagrany w ramach projektu %s%s.\n%s" % ( - self.project.name, - " finansowanego przez %s" % self.project.sponsors if self.project.sponsors else "", - ADVERT) + comment = "\n".join(( + self.project.get_description(), + ADVERT + )) tags = { 'album': PROJECT, @@ -128,14 +201,41 @@ class Audiobook(models.Model): 'date': self.date, 'genre': 'Speech', 'language': 'pol', - 'license': LICENSE, 'organization': ORGANIZATION, 'title': title, - #'flac_sha1': self.get_source_sha1(), 'project': self.project.name, - 'funded_by': self.project.sponsors, } - if self.source_sha1 and self.source_sha1 != 'wait': + if self.license: + tags['license'] = self.license.uri + if self.project.sponsors: + tags['funded_by'] = self.project.sponsors + + if self.source_sha1: tags['flac_sha1'] = self.source_sha1 return tags + @cached_property + def book(self): + if self.slug: + apidata = requests.get(f'https://wolnelektury.pl/api/books/{self.slug}/').json() + else: + return {} + return apidata + + @property + def document(self): + from librarian.document import WLDocument, parser + from lxml import etree + + xml_url = self.book.get('xml', None) + if xml_url is None: + return None + + return WLDocument( + etree.parse( + io.BytesIO( + requests.get(xml_url).content + ) + ,parser = parser + ) + )