filters api
[wolnelektury.git] / src / catalogue / api / views.py
1 # This file is part of Wolne Lektury, licensed under GNU Affero GPLv3 or later.
2 # Copyright © Fundacja Wolne Lektury. See NOTICE for more information.
3 #
4 import json
5 import os.path
6 from urllib.request import urlopen
7 from django.conf import settings
8 from django.core.files.base import ContentFile
9 from django.http import Http404, HttpResponse
10 from django.utils.decorators import method_decorator
11 from django.views.decorators.cache import never_cache
12 from django_filters import rest_framework as dfilters
13 from rest_framework import filters
14 from rest_framework.generics import (ListAPIView, RetrieveAPIView,
15                                      RetrieveUpdateAPIView, get_object_or_404)
16 from rest_framework.permissions import DjangoModelPermissionsOrAnonReadOnly
17 from rest_framework.response import Response
18 from rest_framework import status
19 from api.handlers import read_tags
20 from api.utils import vary_on_auth
21 from catalogue.forms import BookImportForm
22 from catalogue.helpers import get_top_level_related_tags
23 from catalogue.models import Book, Collection, Tag, Fragment, BookMedia
24 from catalogue.models.tag import prefetch_relations
25 from club.models import Membership
26 from club.permissions import IsClubMember
27 from sortify import sortify
28 from wolnelektury.utils import re_escape
29 from .helpers import books_after, order_books
30 from . import serializers
31
32
# Tag categories that describe a book; FilterBookList reads one
# "<category>s" query parameter per entry and prefetches relations for each.
book_tag_categories = [
    'author',
    'epoch',
    'kind',
    'genre',
]
34
35
# Base class for the legacy list endpoints in this module: a ListAPIView
# with pagination switched off.
class LegacyListAPIView(ListAPIView):
    pagination_class = None  # Disable DRF pagination for these views.
38
39
class CreateOnPutMixin:
    '''
    Lets a PUT to a nonexistent resource proceed with a fresh instance.

    When the regular lookup raises Http404 during a PUT, an unsaved model
    instance is returned instead, with its lookup field pre-filled from
    the URL. For any other method the Http404 propagates unchanged.
    '''
    def get_object(self):
        try:
            found = super().get_object()
        except Http404:
            if self.request.method != 'PUT':
                raise
            url_kwarg = self.lookup_url_kwarg or self.lookup_field
            model = self.get_queryset().model
            return model(**{self.lookup_field: self.kwargs[url_kwarg]})
        return found
55
56
class CollectionList(LegacyListAPIView):
    # Unpaginated list of the collections that have listed=True.
    serializer_class = serializers.CollectionListSerializer
    queryset = Collection.objects.filter(listed=True)
60
61
@vary_on_auth  # Because of 'liked'.
class CollectionDetail(CreateOnPutMixin, RetrieveUpdateAPIView):
    # Retrieve or update a single collection looked up by slug.
    # CreateOnPutMixin makes a PUT to an unknown slug start from a new,
    # unsaved Collection instead of failing with 404.
    serializer_class = serializers.CollectionSerializer
    lookup_field = 'slug'
    queryset = Collection.objects.all()
    permission_classes = [DjangoModelPermissionsOrAnonReadOnly]
68
69
@vary_on_auth  # Because of 'liked'.
class BookList(LegacyListAPIView):
    # Legacy unpaginated book list.
    # GET lists findable books, narrowed by the tags and flags passed in the
    # URL kwargs and by the 'after'/'count' options. POST imports a book, or
    # attaches audiobook media when the URL sets the 'audiobooks' kwarg.
    permission_classes = [DjangoModelPermissionsOrAnonReadOnly]
    queryset = Book.objects.none()  # Required for DjangoModelPermissions
    serializer_class = serializers.BookListSerializer

    def get(self, request, filename=None, **kwargs):
        """Serve a pre-generated listing file when possible, else list live.

        A file named ``<filename>.<renderer format>`` under
        ``MEDIA_ROOT/api`` is returned verbatim when ``filename`` is given,
        no tags are requested and no ``count`` query parameter is present.
        If the file cannot be read, the regular list response is produced.
        """
        if filename and not kwargs.get('tags') and 'count' not in request.query_params:
            path = os.path.join(
                settings.MEDIA_ROOT, 'api',
                '%s.%s' % (filename, request.accepted_renderer.format))
            try:
                with open(path, 'rb') as f:
                    content = f.read()
            except (OSError, ValueError):
                # Best effort: a missing/unreadable file (or an unusable
                # path) just means we fall back to the live listing.
                pass
            else:
                return HttpResponse(content, content_type=request.accepted_media_type)
        return super().get(request, filename=filename, **kwargs)

    def get_queryset(self):
        """Build the book queryset from URL kwargs and query parameters.

        Raises:
            Http404: when the tags cannot be parsed, when ``count`` is not a
                non-negative integer, or when a top-level tagged listing is
                empty.
        """
        try:
            tags, _ancestors = read_tags(
                self.kwargs.get('tags', ''), self.request,
                allowed=('author', 'epoch', 'kind', 'genre')
            )
        except ValueError:
            raise Http404

        new_api = self.request.query_params.get('new_api')
        after = self.request.query_params.get('after', self.kwargs.get('after'))
        count = self.request.query_params.get('count', self.kwargs.get('count'))
        if count:
            try:
                # A non-numeric string raises ValueError, not TypeError.
                count = int(count)
            except (TypeError, ValueError):
                raise Http404
            if count < 0:
                # Negative bounds are rejected by queryset slicing.
                raise Http404

        if tags:
            if self.kwargs.get('top_level'):
                # Top-level tagged listings are returned as-is, without the
                # filtering, ordering and limiting applied below.
                books = Book.tagged_top_level(tags)
                if not books:
                    raise Http404
                return books
            else:
                books = Book.tagged.with_all(tags)
        else:
            books = Book.objects.all()
        books = books.filter(findable=True)
        books = order_books(books, new_api)

        if not Membership.is_active_for(self.request.user):
            books = books.exclude(preview=True)

        if self.kwargs.get('top_level'):
            books = books.filter(parent=None)
        if self.kwargs.get('audiobooks'):
            books = books.filter(media__type='mp3').distinct()
        if self.kwargs.get('daisy'):
            books = books.filter(media__type='daisy').distinct()
        if self.kwargs.get('recommended'):
            books = books.filter(recommended=True)
        if self.kwargs.get('newest'):
            books = books.order_by('-created_at')

        if after:
            books = books_after(books, after, new_api)

        # Keep the value returned by prefetch_relations: FilterBookList in
        # this module uses it as returning the queryset to work with, so
        # discarding the result would drop the prefetch.
        for category in ('author', 'genre', 'kind', 'epoch'):
            books = prefetch_relations(books, category)

        if count:
            books = books[:count]

        return books

    def post(self, request, **kwargs):
        """Dispatch to audiobook upload or book import based on URL kwargs."""
        if kwargs.get('audiobooks'):
            return self.post_audiobook(request, **kwargs)
        else:
            return self.post_book(request, **kwargs)

    def post_book(self, request, **kwargs):
        """Import a book from the JSON document in the 'data' POST field.

        Returns 201 on success; raises Http404 when the import form does not
        validate.
        """
        data = json.loads(request.POST.get('data'))
        form = BookImportForm(data)
        if form.is_valid():
            form.save()
            return Response({}, status=status.HTTP_201_CREATED)
        else:
            raise Http404

    def post_audiobook(self, request, **kwargs):
        """Create or update one media part of a book from POST fields.

        The book is identified by the last path segment of the 'book' field.
        When 'source_sha1' is given and the book already has media of the
        same type with that hash, that record is updated; otherwise a new
        BookMedia is created. Returns 201.

        Raises:
            Http404: when no book matches the slug.
        """
        index = int(request.POST['part_index'])
        parts_count = int(request.POST['parts_count'])
        media_type = request.POST['type'].lower()
        source_sha1 = request.POST.get('source_sha1')
        name = request.POST.get('name', '')
        part_name = request.POST.get('part_name', '')

        project_description = request.POST.get('project_description', '')
        project_icon = request.POST.get('project_icon', '')

        # Take the last path segment; also accepts a bare slug.
        slug = request.POST['book'].rstrip('/').rsplit('/', 1)[-1]
        book = get_object_or_404(Book, slug=slug)

        # Explicit check instead of `assert`, which is stripped under -O.
        bm = None
        if source_sha1:
            try:
                bm = book.media.get(type=media_type, source_sha1=source_sha1)
            except BookMedia.DoesNotExist:
                pass
        if bm is None:
            bm = BookMedia(book=book, type=media_type)
        bm.name = name
        bm.part_name = part_name
        bm.index = index
        bm.project_description = project_description
        bm.project_icon = project_icon
        bm.file.save(None, request.data['file'], save=False)
        bm.save(parts_count=parts_count)

        return Response({}, status=status.HTTP_201_CREATED)
187
188
# Filter set used by BookList2.
class BookFilter(dfilters.FilterSet):
    # 'sort' query parameter: ordering by 'alpha' (sort_key_author field)
    # or by 'popularity'.
    sort = dfilters.OrderingFilter(
        fields=(
            ('sort_key_author', 'alpha'),
            ('popularity', 'popularity'),
        )
    )
    # 'tag' query parameter: one or more author/epoch/genre/kind tags;
    # conjoined=True requires a book to match all of the given tags.
    tag = dfilters.ModelMultipleChoiceFilter(
        field_name='tag_relations__tag',
        queryset=Tag.objects.filter(category__in=('author', 'epoch', 'genre', 'kind')),
        conjoined=True,
    )
201
202
class BookList2(ListAPIView):
    # List of findable books with BookFilter filtering and title search.
    serializer_class = serializers.BookSerializer2
    queryset = Book.objects.none()  # Required for DjangoModelPermissions
    permission_classes = [DjangoModelPermissionsOrAnonReadOnly]
    filterset_class = BookFilter
    filter_backends = (
        dfilters.DjangoFilterBackend,
        filters.SearchFilter,
    )
    search_fields = [
        'title',
    ]

    def get_queryset(self):
        """Return all findable books in the order given by order_books."""
        findable = Book.objects.all().filter(findable=True)
        return order_books(findable, True)
222
223
class BookList11Labs(BookList2):
    # Variant of BookList2 limited to books whose license field is empty,
    # rendered with BookSerializer11Labs.
    serializer_class = serializers.BookSerializer11Labs

    def get_queryset(self):
        """Return findable books with an empty license, ordered."""
        candidates = Book.objects.all().filter(findable=True).filter(license='')
        return order_books(candidates, True)
234
235
@vary_on_auth  # Because of 'liked'.
class BookDetail(RetrieveAPIView):
    # Single book, looked up by slug.
    serializer_class = serializers.BookDetailSerializer
    lookup_field = 'slug'
    queryset = Book.objects.all()
241
242
class BookDetail2(RetrieveAPIView):
    # Single book, looked up by slug, rendered with BookSerializer2.
    serializer_class = serializers.BookSerializer2
    lookup_field = 'slug'
    queryset = Book.objects.all()
247
248
@vary_on_auth  # Because of embargo links.
class EbookList(BookList):
    # Same listing behaviour as BookList; only the serializer differs.
    serializer_class = serializers.EbookSerializer
252
253
@method_decorator(never_cache, name='dispatch')
class Preview(LegacyListAPIView):
    # Lists books flagged as preview. The queryset is built per request
    # (see get_queryset) rather than declared as a class attribute.
    serializer_class = serializers.BookPreviewSerializer

    def get_queryset(self):
        """Return preview books, or nothing for non-debug 'Darwin' clients."""
        request = self.request
        previews = Book.objects.filter(preview=True)
        # FIXME: temporary workaround for a problem with iOS app; see #3954.
        from_darwin = 'Darwin' in request.META.get('HTTP_USER_AGENT', '')
        if from_darwin and 'debug' not in request.GET:
            return previews.none()
        return previews
265
266
@vary_on_auth  # Because of 'liked'.
class FilterBookList(LegacyListAPIView):
    # Filterable/searchable book list. Returns a plain list of books, each
    # annotated with a `key` attribute ("<label>$<position>") that a client
    # can pass back as 'after' to continue the listing.
    serializer_class = serializers.FilterBookListSerializer

    def parse_bool(self, s):
        """Map 'true'/'false' to True/False; anything else gives None."""
        if s in ('true', 'false'):
            return s == 'true'
        else:
            return None

    def get_queryset(self):
        """Return up to ``count`` books matching the query parameters.

        Recognised parameters: search, lektura, audiobook, preview, new_api,
        after, count (default 50) and one comma-separated slug list per tag
        category (authors, epochs, kinds, genres).

        With a search string of at least 3 characters, author matches are
        listed first and title-only matches after them.

        Raises:
            Http404: when ``count`` is not a non-negative integer.
        """
        key_sep = '$'
        params = self.request.query_params
        search_string = params.get('search')
        is_lektura = self.parse_bool(params.get('lektura'))
        is_audiobook = self.parse_bool(params.get('audiobook'))
        preview = self.parse_bool(params.get('preview'))
        if not Membership.is_active_for(self.request.user):
            # Without an active membership only non-preview books are shown.
            preview = False

        new_api = params.get('new_api')
        after = params.get('after')
        try:
            count = int(params.get('count', 50))
        except (TypeError, ValueError):
            # Invalid user input must not surface as a server error.
            raise Http404
        if count < 0:
            # Negative bounds are rejected by queryset slicing.
            raise Http404

        # The cursor has the form "<which>$<key>"; anything else is ignored.
        cursor = None
        if after and key_sep in after:
            cursor = after.split(key_sep, 1)

        books = order_books(Book.objects.distinct(), new_api)
        books = books.filter(findable=True)
        if is_lektura is not None:
            books = books.filter(has_audience=is_lektura)
        if is_audiobook is not None:
            if is_audiobook:
                books = books.filter(media__type='mp3')
            else:
                books = books.exclude(media__type='mp3')
        if preview is not None:
            books = books.filter(preview=preview)
        for category in book_tag_categories:
            category_plural = category + 's'
            if category_plural in params:
                slugs = params[category_plural].split(',')
                tags = Tag.objects.filter(category=category, slug__in=slugs)
                books = Book.tagged.with_any(tags, books)

        # Search strings shorter than 3 characters are ignored.
        if (search_string is not None) and len(search_string) < 3:
            search_string = None
        if search_string:
            search_string = re_escape(search_string)
            books_author = books.filter(cached_author__iregex=r'\m' + search_string)
            books_title = books.filter(title__iregex=r'\m' + search_string)
            # Books already matched by author are not repeated under title.
            books_title = books_title.exclude(id__in=list(books_author.values_list('id', flat=True)))
            if cursor is not None:
                which, key = cursor
                if which == 'title':
                    book_lists = [(books_after(books_title, key, new_api), 'title')]
                else:  # which == 'author'
                    book_lists = [(books_after(books_author, key, new_api), 'author'), (books_title, 'title')]
            else:
                book_lists = [(books_author, 'author'), (books_title, 'title')]
        else:
            if cursor is not None:
                _which, key = cursor
                books = books_after(books, key, new_api)
            book_lists = [(books, 'book')]

        filtered_books = []
        for book_list, label in book_lists:
            for category in book_tag_categories:
                book_list = prefetch_relations(book_list, category)
            remaining_count = count - len(filtered_books)
            for book in book_list[:remaining_count]:
                book.key = '%s%s%s' % (
                    label, key_sep, book.slug if not new_api else book.full_sort_key())
                filtered_books.append(book)
            if len(filtered_books) == count:
                break

        return filtered_books
340
341
class EpubView(RetrieveAPIView):
    # Returns a book's 'epub' media; access is restricted by IsClubMember.
    permission_classes = [IsClubMember]
    lookup_field = 'slug'
    queryset = Book.objects.all()

    @method_decorator(never_cache)
    def get(self, *args, **kwargs):
        """Respond with the result of get_media('epub') for the book."""
        book = self.get_object()
        return HttpResponse(book.get_media('epub'))
350
351
class TagCategoryView(LegacyListAPIView):
    # Lists tags of the category given in the URL, ordered by slug,
    # skipping tags without any items.
    serializer_class = serializers.TagSerializer

    def get_queryset(self):
        """Return the category's tags, optionally windowed by after/count.

        Query parameters:
            after: only tags whose slug sorts after this value.
            count: maximum number of tags to return.

        Raises:
            Http404: when ``count`` is not a non-negative integer.
        """
        category = self.kwargs['category']
        tags = Tag.objects.filter(category=category).exclude(items=None).order_by('slug')

        after = self.request.query_params.get('after')
        count = self.request.query_params.get('count')
        if after:
            tags = tags.filter(slug__gt=after)
        if count:
            # Query parameters are strings; a slice bound has to be an int.
            try:
                limit = int(count)
            except (TypeError, ValueError):
                raise Http404
            if limit < 0:
                raise Http404
            tags = tags[:limit]

        return tags
367
class AuthorList(ListAPIView):
    # List endpoint for tags in the 'author' category.
    queryset = Tag.objects.filter(category='author')
    serializer_class = serializers.AuthorSerializer
371
class AuthorView(RetrieveAPIView):
    # Single 'author' tag, looked up by slug.
    lookup_field = 'slug'
    queryset = Tag.objects.filter(category='author')
    serializer_class = serializers.AuthorSerializer
376
class EpochList(ListAPIView):
    # List endpoint for tags in the 'epoch' category.
    queryset = Tag.objects.filter(category='epoch')
    serializer_class = serializers.EpochSerializer
380
class EpochView(RetrieveAPIView):
    # Single 'epoch' tag, looked up by slug.
    lookup_field = 'slug'
    queryset = Tag.objects.filter(category='epoch')
    serializer_class = serializers.EpochSerializer
385
class GenreList(ListAPIView):
    # List endpoint for tags in the 'genre' category.
    queryset = Tag.objects.filter(category='genre')
    serializer_class = serializers.GenreSerializer
389
class GenreView(RetrieveAPIView):
    # Single 'genre' tag, looked up by slug.
    lookup_field = 'slug'
    queryset = Tag.objects.filter(category='genre')
    serializer_class = serializers.GenreSerializer
394
class KindList(ListAPIView):
    # List endpoint for tags in the 'kind' category.
    queryset = Tag.objects.filter(category='kind')
    serializer_class = serializers.KindSerializer
398
class KindView(RetrieveAPIView):
    # Single 'kind' tag, looked up by slug.
    lookup_field = 'slug'
    queryset = Tag.objects.filter(category='kind')
    serializer_class = serializers.KindSerializer
403
404
class TagView(RetrieveAPIView):
    # Retrieve a tag by category and slug; POST creates or updates it from
    # a JSON document.
    permission_classes = [DjangoModelPermissionsOrAnonReadOnly]
    serializer_class = serializers.TagDetailSerializer
    queryset = Tag.objects.all()

    def get_object(self):
        """Return the tag named by the URL's category and slug.

        For POST requests a missing tag yields a new, unsaved Tag with the
        category and slug filled in; for other methods Http404 propagates.
        """
        try:
            return get_object_or_404(
                Tag,
                category=self.kwargs['category'],
                slug=self.kwargs['slug']
            )
        except Http404:
            if self.request.method == 'POST':
                return Tag(
                    category=self.kwargs['category'],
                    slug=self.kwargs['slug']
                )
            else:
                raise

    def post(self, request, **kwargs):
        """Create or update the tag from the JSON in the 'data' POST field.

        Only non-empty values are applied. For author tags, 'name_pl' also
        sets the sort key and is rewritten from "Last, First" to
        "First Last". When 'photo' holds a URL, the file is downloaded and
        stored as the tag's photo. Returns an empty JSON object.
        """
        data = json.loads(request.POST.get('data'))
        # Maps payload keys to Tag model field names.
        fields = {
            "name_pl": "name_pl",
            "description_pl": "description_pl",
            "plural": "plural",
            "is_epoch_specific": "genre_epoch_specific",
            "collective_noun": "collective_noun",
            "adjective_feminine_singular": "adjective_feminine_singular",
            "adjective_nonmasculine_plural": "adjective_nonmasculine_plural",
            "genitive": "genitive",
            "gazeta_link": "gazeta_link",
            "culturepl_link": "culturepl_link",
            "wiki_link_pl": "wiki_link_pl",
            "photo_attribution": "photo_attribution",
        }
        obj = self.get_object()
        updated = set()
        for data_field, model_field in fields.items():
            value = data.get(data_field)
            if value:
                if obj.category == 'author' and model_field == 'name_pl':
                    # Sort by the name as sent, then store it with the part
                    # after the first comma moved to the front.
                    obj.sort_key = sortify(value.lower())
                    updated.add('sort_key')
                    value = ' '.join(reversed([t.strip() for t in value.split(',', 1)]))
                setattr(obj, model_field, value)
                updated.add(model_field)
        if data.get('photo'):
            # NOTE(review): the URL comes from the request payload and is
            # fetched server-side as-is; confirm callers are trusted.
            with urlopen(data['photo']) as response:
                content_type = response.headers.get('Content-Type', '')
                content = response.read()
            # Drop parameters such as "; charset=..." before taking the
            # subtype as the file extension.
            ext = content_type.split(';', 1)[0].strip().rsplit('/', 1)[-1]
            obj.photo.save(
                "{}.{}".format(self.kwargs['slug'], ext),
                ContentFile(content),
                save=False,
            )
            updated.add('photo')

        if obj.pk:
            # Existing tag: write only the fields that were touched.
            obj.save(update_fields=updated, quick=True)
        else:
            obj.save()
        return Response({})
469
470
@vary_on_auth  # Because of 'liked'.
class FragmentList(LegacyListAPIView):
    # Unpaginated list of fragments carrying all the tags given in the URL.
    serializer_class = serializers.FragmentSerializer

    def get_queryset(self):
        """Return fragments of findable books tagged with all URL tags.

        Raises Http404 when the tags cannot be parsed.
        """
        allowed_categories = {'author', 'epoch', 'kind', 'genre', 'book', 'theme'}
        try:
            tags, _ancestors = read_tags(
                self.kwargs['tags'], self.request, allowed=allowed_categories)
        except ValueError:
            raise Http404
        fragments = Fragment.tagged.with_all(tags)
        fragments = fragments.filter(book__findable=True)
        return fragments.select_related('book')
485
486
@vary_on_auth  # Because of 'liked'.
class FragmentView(RetrieveAPIView):
    # Single fragment, identified by its book's slug and its anchor.
    serializer_class = serializers.FragmentDetailSerializer

    def get_object(self):
        """Return the matching Fragment or raise Http404."""
        lookup = {
            'book__slug': self.kwargs['book'],
            'anchor': self.kwargs['anchor'],
        }
        return get_object_or_404(Fragment, **lookup)
497
498
class SuggestedTags(ListAPIView):
    # Tags related to the tags whose ids are given as repeated 'tag'
    # query parameters.
    serializer_class = serializers.FilterTagSerializer

    def get_queryset(self):
        """Return the top-level related tags; 404 if any given id is unknown."""
        selected = []
        for tag_id in self.request.GET.getlist('tag', []):
            selected.append(get_object_or_404(Tag, id=tag_id))
        related_ids = [tag.id for tag in get_top_level_related_tags(selected)]
        return Tag.objects.filter(id__in=related_ids)