Fixes for app
[wolnelektury.git] / src / catalogue / api / views.py
1 # This file is part of Wolne Lektury, licensed under GNU Affero GPLv3 or later.
2 # Copyright © Fundacja Wolne Lektury. See NOTICE for more information.
3 #
4 import json
5 import os.path
6 from urllib.request import urlopen
7 from django.conf import settings
8 from django.core.files.base import ContentFile
9 from django.http import Http404, HttpResponse, JsonResponse
10 from django.utils.decorators import method_decorator
11 from django.views.decorators.cache import never_cache
12 from django_filters import rest_framework as dfilters
13 from rest_framework import filters
14 from rest_framework.generics import (ListAPIView, RetrieveAPIView,
15                                      RetrieveUpdateAPIView, get_object_or_404)
16 from rest_framework.permissions import DjangoModelPermissionsOrAnonReadOnly
17 from rest_framework.response import Response
18 from rest_framework import status
19 from api.handlers import read_tags
20 from api.utils import vary_on_auth
21 from catalogue.forms import BookImportForm
22 from catalogue.helpers import get_top_level_related_tags
23 from catalogue.models import Book, Collection, Tag, Fragment, BookMedia
24 from catalogue.models.tag import prefetch_relations
25 from club.models import Membership
26 from club.permissions import IsClubMember
27 from sortify import sortify
28 from wolnelektury.utils import re_escape
29 from .helpers import books_after, order_books
30 from . import serializers
31
32
# Tag categories that FilterBookList walks through when it applies the
# per-category query filters and prefetches tag relations.
book_tag_categories = [
    'author',
    'epoch',
    'kind',
    'genre',
]
34
35
# Base class for list endpoints that must not be paginated: with
# pagination_class set to None the whole result is sent in one response.
class LegacyListAPIView(ListAPIView):
    pagination_class = None
38
39
class CreateOnPutMixin:
    '''
    Lets a PUT request address a resource that does not exist yet.

    If the regular lookup ends in Http404 while handling a PUT, a new,
    unsaved instance of the queryset's model is returned instead, with
    the lookup field preset from the URL.  For any other HTTP method
    the Http404 is re-raised untouched.
    '''
    def get_object(self):
        try:
            found = super().get_object()
        except Http404:
            if self.request.method != 'PUT':
                raise
            url_kwarg = self.lookup_url_kwarg or self.lookup_field
            model_class = self.get_queryset().model
            initial = {self.lookup_field: self.kwargs[url_kwarg]}
            return model_class(**initial)
        return found
55
56
# Unpaginated list of the collections that have listed=True.
class CollectionList(LegacyListAPIView):
    serializer_class = serializers.CollectionListSerializer
    queryset = Collection.objects.filter(listed=True)
60
61
@vary_on_auth  # Because of 'liked'.
class CollectionDetail(CreateOnPutMixin, RetrieveUpdateAPIView):
    # Retrieve or update one collection addressed by its slug.  Thanks to
    # CreateOnPutMixin, a PUT to an unknown slug starts from a fresh,
    # unsaved Collection instead of ending in 404.
    serializer_class = serializers.CollectionSerializer
    lookup_field = 'slug'
    queryset = Collection.objects.all()
    permission_classes = [DjangoModelPermissionsOrAnonReadOnly]
68
69
@vary_on_auth  # Because of 'liked'.
class BookList(LegacyListAPIView):
    # Unpaginated list of books, optionally narrowed by tags and by flags
    # taken from the URL kwargs (top_level, audiobooks, daisy, recommended,
    # newest).  POST imports either a book or a single audiobook part.
    permission_classes = [DjangoModelPermissionsOrAnonReadOnly]
    queryset = Book.objects.none()  # Required for DjangoModelPermissions
    serializer_class = serializers.BookListSerializer

    def get(self, request, filename=None, **kwargs):
        # Shortcut: when a pre-generated file named "<filename>.<format>"
        # exists under MEDIA_ROOT/api, send it verbatim.  Requests filtered
        # by tags or limited with ?count= are always computed live.
        if filename and not kwargs.get('tags') and 'count' not in request.query_params:
            path = os.path.join(
                settings.MEDIA_ROOT, 'api',
                '%s.%s' % (filename, request.accepted_renderer.format))
            try:
                with open(path, 'rb') as f:
                    content = f.read()
            except (OSError, ValueError):
                # The file is missing or unreadable (OSError), or the path
                # is one open() rejects, e.g. an embedded NUL (ValueError):
                # fall through to the regular, computed response.
                pass
            else:
                return HttpResponse(content, content_type=request.accepted_media_type)
        return super().get(request, filename=filename, **kwargs)

    def get_queryset(self):
        '''
        Build the book list for the current request.

        Raises Http404 when the tag path cannot be parsed, when `count`
        is not a non-negative integer, or when a top-level tag query
        matches no books.
        '''
        try:
            tags, ancestors = read_tags(
                self.kwargs.get('tags', ''), self.request,
                allowed=('author', 'epoch', 'kind', 'genre')
            )
        except ValueError:
            raise Http404

        new_api = self.request.query_params.get('new_api')
        # Query parameters take precedence over values captured from the URL.
        after = self.request.query_params.get('after', self.kwargs.get('after'))
        count = self.request.query_params.get('count', self.kwargs.get('count'))
        if count:
            try:
                count = int(count)
            except (TypeError, ValueError):
                # int() raises ValueError for a non-numeric string.
                raise Http404  # Fixme
            if count < 0:
                # QuerySets do not support negative slice bounds.
                raise Http404

        if tags:
            if self.kwargs.get('top_level'):
                # This branch returns early: none of the filters below
                # are applied to the tagged top-level result.
                books = Book.tagged_top_level(tags)
                if not books:
                    raise Http404
                return books
            else:
                books = Book.tagged.with_all(tags)
        else:
            books = Book.objects.all()
        books = books.filter(findable=True)
        books = order_books(books, new_api)

        if not Membership.is_active_for(self.request.user):
            books = books.exclude(preview=True)

        if self.kwargs.get('top_level'):
            books = books.filter(parent=None)
        if self.kwargs.get('audiobooks'):
            books = books.filter(media__type='mp3').distinct()
        if self.kwargs.get('daisy'):
            books = books.filter(media__type='daisy').distinct()
        if self.kwargs.get('recommended'):
            books = books.filter(recommended=True)
        if self.kwargs.get('newest'):
            books = books.order_by('-created_at')

        if after:
            books = books_after(books, after, new_api)

        # Keep the value returned by prefetch_relations(), the same way
        # FilterBookList does; the result used to be thrown away here.
        # NOTE(review): assumes prefetch_relations() returns the queryset
        # to use, as its other call site in this module relies on.
        for category in ('author', 'genre', 'kind', 'epoch'):
            books = prefetch_relations(books, category)

        # A count of 0 is falsy and therefore means "no limit".
        if count:
            books = books[:count]

        return books

    def post(self, request, **kwargs):
        # Dispatch on the 'audiobooks' URL kwarg.
        if kwargs.get('audiobooks'):
            return self.post_audiobook(request, **kwargs)
        else:
            return self.post_book(request, **kwargs)

    def post_book(self, request, **kwargs):
        '''
        Import a book described by the JSON document in the 'data' field.

        Responds with 201 on success; raises Http404 when the import
        form does not validate.
        '''
        data = json.loads(request.POST.get('data'))
        form = BookImportForm(data)
        if form.is_valid():
            form.save()
            return Response({}, status=status.HTTP_201_CREATED)
        else:
            raise Http404

    def post_audiobook(self, request, **kwargs):
        '''
        Create or update one media part of a book from the POSTed fields.

        An existing BookMedia is reused only when `source_sha1` is given
        and matches a medium of the same type; otherwise a new one is
        created.  Raises Http404 when the referenced book does not exist.
        '''
        index = int(request.POST['part_index'])
        parts_count = int(request.POST['parts_count'])
        media_type = request.POST['type'].lower()
        source_sha1 = request.POST.get('source_sha1')
        name = request.POST.get('name', '')
        part_name = request.POST.get('part_name', '')

        project_description = request.POST.get('project_description', '')
        project_icon = request.POST.get('project_icon', '')

        # 'book' holds a URL-like path; its last segment is the book slug.
        _rest, slug = request.POST['book'].rstrip('/').rsplit('/', 1)
        book = get_object_or_404(Book, slug=slug)

        # Explicit check instead of `assert`: assertions vanish under
        # `python -O`, which would let a lookup with source_sha1=None run.
        bm = None
        if source_sha1:
            try:
                bm = book.media.get(type=media_type, source_sha1=source_sha1)
            except BookMedia.DoesNotExist:
                pass
        if bm is None:
            bm = BookMedia(book=book, type=media_type)
        bm.name = name
        bm.part_name = part_name
        bm.index = index
        bm.project_description = project_description
        bm.project_icon = project_icon
        bm.file.save(None, request.data['file'], save=False)
        bm.save(parts_count=parts_count)

        return Response({}, status=status.HTTP_201_CREATED)
187
188
# FilterSet plugged into BookList2 through its filterset_class attribute.
# The filters are left in their original declaration order.
class BookFilter(dfilters.FilterSet):
    # Ordering: each pair maps a model field to the public name accepted
    # in the `sort` query parameter ('alpha' -> sort_key_author).
    sort = dfilters.OrderingFilter(
        fields=(
            ('sort_key_author', 'alpha'),
            ('popularity', 'popularity'),
        )
    )
    # Multi-valued tag filter limited to the four book tag categories;
    # conjoined=True requires a book to match every tag given.
    tag = dfilters.ModelMultipleChoiceFilter(
        field_name='tag_relations__tag',
        queryset=Tag.objects.filter(category__in=('author', 'epoch', 'genre', 'kind')),
        conjoined=True,
    )
    # Translators are looked up among tags of category 'author'; again
    # every translator given must match.
    translator = dfilters.ModelMultipleChoiceFilter(
        field_name='translators',
        queryset=Tag.objects.filter(category='author'),
        conjoined=True,
    )
    # No field_name is given, so django-filter uses the attribute name.
    has_audio = dfilters.BooleanFilter()
207
208
class BookList2(ListAPIView):
    # List of findable books; filtering is delegated to BookFilter and
    # free-text search runs against the title.
    serializer_class = serializers.BookSerializer2
    queryset = Book.objects.none()  # Required for DjangoModelPermissions
    permission_classes = [DjangoModelPermissionsOrAnonReadOnly]
    filterset_class = BookFilter
    filter_backends = (
        dfilters.DjangoFilterBackend,
        filters.SearchFilter,
    )
    search_fields = ['title']

    def get_queryset(self):
        '''Return the findable books, ordered by order_books().'''
        findable = Book.objects.filter(findable=True)
        return order_books(findable, True)
228
229
class BookRecommendationsView(ListAPIView):
    # Unpaginated list of up to three recommendations for one book.
    pagination_class = None
    serializer_class = serializers.BookSerializer2

    def get_queryset(self):
        '''Return get_recommended(limit=3) of the book named by the slug; 404 if unknown.'''
        slug = self.kwargs['slug']
        source_book = get_object_or_404(Book, slug=slug)
        return source_book.get_recommended(limit=3)
240
241
class BookList11Labs(BookList2):
    # Same list as BookList2, restricted to books whose `license` field
    # is the empty string and rendered with a dedicated serializer.
    serializer_class = serializers.BookSerializer11Labs

    def get_queryset(self):
        '''Return findable books with an empty license, ordered by order_books().'''
        candidates = Book.objects.filter(findable=True).filter(license='')
        return order_books(candidates, True)
252
253
@vary_on_auth  # Because of 'liked'.
class BookDetail(RetrieveAPIView):
    # Single book, looked up by slug among all books.
    serializer_class = serializers.BookDetailSerializer
    lookup_field = 'slug'
    queryset = Book.objects.all()
259
260
class BookDetail2(RetrieveAPIView):
    # Single book by slug, rendered with BookSerializer2.
    serializer_class = serializers.BookSerializer2
    lookup_field = 'slug'
    queryset = Book.objects.all()
265
266
class BookSyncView(RetrieveAPIView):
    # Returns the (id, timestamp) pairs from Book.get_sync() as a JSON list.
    lookup_field = 'slug'
    queryset = Book.objects.all()

    def retrieve(self, request, *args, **kwargs):
        book = self.get_object()
        payload = []
        for ident, timestamp in book.get_sync():
            payload.append({"id": ident, "timestamp": timestamp})
        return Response(payload)
277
278     
# Same listing logic as BookList; only the serializer differs.
@vary_on_auth  # Because of embargo links.
class EbookList(BookList):
    serializer_class = serializers.EbookSerializer
282
283
@method_decorator(never_cache, name='dispatch')
class Preview(LegacyListAPIView):
    # Never-cached, unpaginated list of books flagged as previews.
    serializer_class = serializers.BookPreviewSerializer

    def get_queryset(self):
        '''Return the preview books, or an empty result for 'Darwin' user agents without ?debug.'''
        previews = Book.objects.filter(preview=True)
        # FIXME: temporary workaround for a problem with iOS app; see #3954.
        user_agent = self.request.META.get('HTTP_USER_AGENT', '')
        if 'Darwin' not in user_agent or 'debug' in self.request.GET:
            return previews
        return previews.none()
295
296
@vary_on_auth  # Because of 'liked'.
class FilterBookList(LegacyListAPIView):
    # Filtered and searchable book list.  Every returned book gets a `key`
    # attribute ("<label>$<slug or sort key>") that clients send back as
    # ?after= to continue from that position.
    serializer_class = serializers.FilterBookListSerializer

    def parse_bool(self, s):
        '''Map 'true'/'false' to True/False; any other value (None included) to None.'''
        if s in ('true', 'false'):
            return s == 'true'
        else:
            return None

    def get_queryset(self):
        '''
        Return a plain list of at most `count` books (default 50).

        Raises Http404 when `count` is not a non-negative integer.
        '''
        key_sep = '$'
        search_string = self.request.query_params.get('search')
        is_lektura = self.parse_bool(self.request.query_params.get('lektura'))
        is_audiobook = self.parse_bool(self.request.query_params.get('audiobook'))
        preview = self.parse_bool(self.request.query_params.get('preview'))
        # Users without an active membership only ever see non-preview books.
        if not Membership.is_active_for(self.request.user):
            preview = False

        new_api = self.request.query_params.get('new_api')
        after = self.request.query_params.get('after')
        try:
            count = int(self.request.query_params.get('count', 50))
        except ValueError:
            # Non-numeric ?count= used to surface as a server error.
            raise Http404
        if count < 0:
            # A negative limit would turn into a negative slice bound below.
            raise Http404

        books = order_books(Book.objects.distinct(), new_api)
        books = books.filter(findable=True)
        if is_lektura is not None:
            books = books.filter(has_audience=is_lektura)
        if is_audiobook is not None:
            if is_audiobook:
                books = books.filter(media__type='mp3')
            else:
                books = books.exclude(media__type='mp3')
        if preview is not None:
            books = books.filter(preview=preview)
        # ?authors=a,b&genres=c ...: within one category any tag may match.
        for category in book_tag_categories:
            category_plural = category + 's'
            if category_plural in self.request.query_params:
                slugs = self.request.query_params[category_plural].split(',')
                tags = Tag.objects.filter(category=category, slug__in=slugs)
                books = Book.tagged.with_any(tags, books)
        # Search strings shorter than three characters are ignored.
        if (search_string is not None) and len(search_string) < 3:
            search_string = None
        if search_string:
            search_string = re_escape(search_string)
            books_author = books.filter(cached_author__iregex=r'\m' + search_string)
            books_title = books.filter(title__iregex=r'\m' + search_string)
            # Author matches come first; drop them from the title matches
            # so that no book is listed twice.
            books_title = books_title.exclude(id__in=list(books_author.values_list('id', flat=True)))
            if after and (key_sep in after):
                which, key = after.split(key_sep, 1)
                if which == 'title':
                    book_lists = [(books_after(books_title, key, new_api), 'title')]
                else:  # which == 'author'
                    book_lists = [(books_after(books_author, key, new_api), 'author'), (books_title, 'title')]
            else:
                book_lists = [(books_author, 'author'), (books_title, 'title')]
        else:
            if after and key_sep in after:
                # Only the part after the separator matters here.
                _label, key = after.split(key_sep, 1)
                books = books_after(books, key, new_api)
            book_lists = [(books, 'book')]

        filtered_books = []
        for book_list, label in book_lists:
            for category in book_tag_categories:
                book_list = prefetch_relations(book_list, category)
            remaining_count = count - len(filtered_books)
            for book in book_list[:remaining_count]:
                book.key = '%s%s%s' % (
                    label, key_sep, book.slug if not new_api else book.full_sort_key())
                filtered_books.append(book)
            if len(filtered_books) == count:
                break

        return filtered_books
370
371
class EpubView(RetrieveAPIView):
    # Club-members-only, never-cached endpoint that responds with whatever
    # Book.get_media('epub') returns for the book addressed by slug.
    permission_classes = [IsClubMember]
    lookup_field = 'slug'
    queryset = Book.objects.all()

    @method_decorator(never_cache)
    def get(self, *args, **kwargs):
        book = self.get_object()
        epub = book.get_media('epub')
        return HttpResponse(epub)
380
381
class TagCategoryView(LegacyListAPIView):
    # Tags of one category that have at least one item, ordered by slug,
    # with optional ?after=<slug> and ?count=<n> windowing.
    serializer_class = serializers.TagSerializer

    def get_queryset(self):
        '''
        Return the category's tags, windowed by `after` and `count`.

        Raises Http404 when `count` is not a non-negative integer.
        '''
        category = self.kwargs['category']
        tags = Tag.objects.filter(category=category).exclude(items=None).order_by('slug')

        after = self.request.query_params.get('after')
        count = self.request.query_params.get('count')
        if after:
            tags = tags.filter(slug__gt=after)
        if count:
            # Query parameters arrive as strings, while QuerySet slicing
            # needs a non-negative integer bound.
            try:
                limit = int(count)
            except ValueError:
                raise Http404
            if limit < 0:
                raise Http404
            tags = tags[:limit]

        return tags
397
# List of all tags in the 'author' category.
class AuthorList(ListAPIView):
    queryset = Tag.objects.filter(category='author')
    serializer_class = serializers.AuthorSerializer
401
# Single 'author' tag, looked up by slug.
class AuthorView(RetrieveAPIView):
    lookup_field = 'slug'
    queryset = Tag.objects.filter(category='author')
    serializer_class = serializers.AuthorSerializer
406
# List of all tags in the 'epoch' category.
class EpochList(ListAPIView):
    queryset = Tag.objects.filter(category='epoch')
    serializer_class = serializers.EpochSerializer
410
# Single 'epoch' tag, looked up by slug.
class EpochView(RetrieveAPIView):
    lookup_field = 'slug'
    queryset = Tag.objects.filter(category='epoch')
    serializer_class = serializers.EpochSerializer
415
# List of all tags in the 'genre' category.
class GenreList(ListAPIView):
    queryset = Tag.objects.filter(category='genre')
    serializer_class = serializers.GenreSerializer
419
# Single 'genre' tag, looked up by slug.
class GenreView(RetrieveAPIView):
    lookup_field = 'slug'
    queryset = Tag.objects.filter(category='genre')
    serializer_class = serializers.GenreSerializer
424
# List of all tags in the 'kind' category.
class KindList(ListAPIView):
    queryset = Tag.objects.filter(category='kind')
    serializer_class = serializers.KindSerializer
428
# Single 'kind' tag, looked up by slug.
class KindView(RetrieveAPIView):
    lookup_field = 'slug'
    queryset = Tag.objects.filter(category='kind')
    serializer_class = serializers.KindSerializer
433
# List of all tags in the 'theme' category.
class ThemeList(ListAPIView):
    queryset = Tag.objects.filter(category='theme')
    serializer_class = serializers.ThemeSerializer
437
# Single 'theme' tag, looked up by slug.
class ThemeView(RetrieveAPIView):
    lookup_field = 'slug'
    queryset = Tag.objects.filter(category='theme')
    serializer_class = serializers.ThemeSerializer
442
443
class TagView(RetrieveAPIView):
    # Detail view of one tag addressed by category and slug.  POST updates
    # the tag from a JSON payload, creating it when it does not exist yet.
    permission_classes = [DjangoModelPermissionsOrAnonReadOnly]
    serializer_class = serializers.TagDetailSerializer
    queryset = Tag.objects.all()

    def get_object(self):
        '''
        Return the tag matching the URL's category and slug.

        On POST an unknown tag yields a new, unsaved Tag carrying that
        category and slug; for other methods Http404 propagates.
        '''
        try:
            return get_object_or_404(
                Tag,
                category=self.kwargs['category'],
                slug=self.kwargs['slug']
            )
        except Http404:
            if self.request.method == 'POST':
                return Tag(
                    category=self.kwargs['category'],
                    slug=self.kwargs['slug']
                )
            else:
                raise

    def post(self, request, **kwargs):
        # The payload is a JSON document in the 'data' form field.
        data = json.loads(request.POST.get('data'))
        # Payload key -> model attribute.  (The original literal listed
        # "collective_noun" twice; the duplicate had no effect.)
        fields = {
            "name_pl": "name_pl",
            "description_pl": "description_pl",
            "plural": "plural",
            "is_epoch_specific": "genre_epoch_specific",
            "collective_noun": "collective_noun",
            "adjective_feminine_singular": "adjective_feminine_singular",
            "adjective_nonmasculine_plural": "adjective_nonmasculine_plural",
            "genitive": "genitive",
            "gazeta_link": "gazeta_link",
            "culturepl_link": "culturepl_link",
            "wiki_link_pl": "wiki_link_pl",
            "photo_attribution": "photo_attribution",
        }
        obj = self.get_object()
        updated = set()
        for data_field, model_field in fields.items():
            value = data.get(data_field)
            # Falsy values are skipped, so this endpoint cannot blank a
            # field or set a flag to False.
            if value:
                if obj.category == 'author' and model_field == 'name_pl':
                    # Author names arrive as "Surname, Given names": the
                    # sort key is built from that form, the stored name is
                    # flipped to "Given names Surname".
                    obj.sort_key = sortify(value.lower())
                    updated.add('sort_key')
                    value = ' '.join(reversed([t.strip() for t in value.split(',', 1)]))
                setattr(obj, model_field, value)
                updated.add(model_field)
        photo_url = data.get('photo')
        if photo_url:
            # NOTE(review): the URL comes straight from the payload and
            # urlopen() also accepts non-HTTP schemes (e.g. file:);
            # consider restricting it to http/https.
            # The context manager closes the connection once read.
            with urlopen(photo_url) as response:
                # File extension is taken from the Content-Type subtype.
                ext = response.headers.get('Content-Type', '').rsplit('/', 1)[-1]
                photo_bytes = response.read()
            obj.photo.save(
                "{}.{}".format(self.kwargs['slug'], ext),
                ContentFile(photo_bytes),
                save=False,
            )
            updated.add('photo')

        if obj.pk:
            # Existing tag: write only the fields touched above.
            obj.save(update_fields=updated, quick=True)
        else:
            obj.save()
        return Response({})
508
509
@vary_on_auth  # Because of 'liked'.
class FragmentList(LegacyListAPIView):
    # Unpaginated list of fragments carrying all tags named in the URL.
    serializer_class = serializers.FragmentSerializer

    def get_queryset(self):
        '''Return fragments of findable books tagged with every requested tag; 404 on a bad tag path.'''
        allowed_categories = {'author', 'epoch', 'kind', 'genre', 'book', 'theme'}
        try:
            tags, _ancestors = read_tags(
                self.kwargs['tags'], self.request, allowed=allowed_categories)
        except ValueError:
            raise Http404
        fragments = Fragment.tagged.with_all(tags)
        fragments = fragments.filter(book__findable=True)
        return fragments.select_related('book')
524
525
@vary_on_auth  # Because of 'liked'.
class FragmentView(RetrieveAPIView):
    # Single fragment identified by its book's slug and its anchor.
    serializer_class = serializers.FragmentDetailSerializer

    def get_object(self):
        '''Return the fragment matching the URL's book and anchor, or raise 404.'''
        lookup = {
            'book__slug': self.kwargs['book'],
            'anchor': self.kwargs['anchor'],
        }
        return get_object_or_404(Fragment, **lookup)
536
537
class SuggestedTags(ListAPIView):
    # Tags related to the tags selected with ?tag=<id> (repeatable),
    # optionally narrowed by ?search=<text>.
    serializer_class = serializers.FilterTagSerializer

    def get_queryset(self):
        '''Return the related tags; an unknown tag id results in 404.'''
        params = self.request.GET
        selected = [
            get_object_or_404(Tag, id=tag_id)
            for tag_id in params.getlist('tag', [])
        ]
        related_ids = [tag.id for tag in get_top_level_related_tags(selected)]
        suggestions = Tag.objects.filter(id__in=related_ids)

        search = params.get('search')
        if search:
            suggestions = suggestions.filter(name__icontains=search)
        return suggestions
550
551
class BookFragmentView(RetrieveAPIView):
    # One fragment picked by Book.choose_fragment() for the given book.
    serializer_class = serializers.FragmentSerializer2

    def get_object(self):
        '''Return choose_fragment() of the book named by the slug; 404 if the book is unknown.'''
        slug = self.kwargs['slug']
        return get_object_or_404(Book, slug=slug).choose_fragment()
558
559
class BookChildrenView(ListAPIView):
    # Unpaginated list of a book's children.
    pagination_class = None
    serializer_class = serializers.BookSerializer2

    def get_queryset(self):
        '''Return get_children() of the book named by the slug; 404 if the book is unknown.'''
        slug = self.kwargs['slug']
        parent = get_object_or_404(Book, slug=slug)
        return parent.get_children()
567
568
class BookMediaView(ListAPIView):
    # Unpaginated list of one book's media of a given type, by index.
    pagination_class = None
    serializer_class = serializers.MediaSerializer2

    def get_queryset(self):
        '''Return the media matching the URL's book slug and type, ordered by index.'''
        lookup = {
            'book__slug': self.kwargs['slug'],
            'type': self.kwargs['type'],
        }
        return BookMedia.objects.filter(**lookup).order_by('index')
578
579
580 from .tojson import conv
581 from lxml import etree
582 from rest_framework.views import APIView
583
class BookJsonView(APIView):
    # Parses the book's XML file and returns the output of conv() as JSON,
    # with non-ASCII characters left unescaped.
    def get(self, request, slug):
        book = get_object_or_404(Book, slug=slug)
        tree = etree.parse(book.xml_file.path)
        document = conv(tree)
        return JsonResponse(document, json_dumps_params={'ensure_ascii': False})