apps/api/handlers.py

   1 # -*- coding: utf-8 -*-
   2 # This file is part of Wolnelektury, licensed under GNU Affero GPLv3 or later.
   3 # Copyright © Fundacja Nowoczesna Polska. See NOTICE for more information.
   4
   5 from datetime import datetime, timedelta
   6 import json
   7 from urlparse import urljoin
   8
   9 from django.conf import settings
  10 from django.contrib.sites.models import Site
  11 from django.core.cache import get_cache
  12 from django.core.urlresolvers import reverse
  13 from piston.handler import AnonymousBaseHandler, BaseHandler
  14 from piston.utils import rc
  15 from sorl.thumbnail import default
  16
  17 from api.helpers import timestamp
  18 from api.models import Deleted
  19 from catalogue.forms import BookImportForm
  20 from catalogue.models import Book, Tag, BookMedia, Fragment
  21 from picture.models import Picture
  22 from picture.forms import PictureImportForm
  23
  24 from stats.utils import piwik_track
  25
  26 API_BASE = WL_BASE = MEDIA_BASE = 'http://' + Site.objects.get_current().domain
  27
  28
  29 category_singular = {
  30     'authors': 'author',
  31     'kinds': 'kind',
  32     'genres': 'genre',
  33     'epochs': 'epoch',
  34     'themes': 'theme',
  35     'books': 'book',
  36 }
  37 category_plural={}
  38 for k, v in category_singular.items():
  39     category_plural[v] = k
  40
  41 book_tag_categories = ['author', 'epoch', 'kind', 'genre']
  42
  43
  44
  45 def read_tags(tags, allowed):
  46     """ Reads a path of filtering tags.
  47
  48     :param str tags: a path of category and slug pairs, like: authors/an-author/...
  49     :returns: list of Tag objects
  50     :raises: ValueError when tags can't be found
  51     """
  52     if not tags:
  53         return []
  54
  55     tags = tags.strip('/').split('/')
  56     real_tags = []
  57     while tags:
  58         category = tags.pop(0)
  59         slug = tags.pop(0)
  60
  61         try:
  62             category = category_singular[category]
  63         except KeyError:
  64             raise ValueError('Unknown category.')
  65
  66         if not category in allowed:
  67             raise ValueError('Category not allowed.')
  68
  69         # !^%@#$^#!
  70         if category == 'book':
  71             slug = 'l-' + slug
  72
  73         try:
  74             real_tags.append(Tag.objects.get(category=category, slug=slug))
  75         except Tag.DoesNotExist:
  76             raise ValueError('Tag not found')
  77     return real_tags
  78
  79
  80 # RESTful handlers
  81
  82
  83 class BookMediaHandler(BaseHandler):
  84     """ Responsible for representing media in Books. """
  85
  86     model = BookMedia
  87     fields = ['name', 'type', 'url', 'artist', 'director']
  88
  89     @classmethod
  90     def url(cls, media):
  91         """ Link to media on site. """
  92
  93         return MEDIA_BASE + media.file.url
  94
  95     @classmethod
  96     def artist(cls, media):
  97         return media.extra_info.get('artist_name', '')
  98
  99     @classmethod
 100     def director(cls, media):
 101         return media.extra_info.get('director_name', '')
 102
 103
 104
 105 class BookDetails(object):
 106     """Custom fields used for representing Books."""
 107
 108     @classmethod
 109     def author(cls, book):
 110         return ",".join(t[0] for t in book.related_info()['tags'].get('author', []))
 111
 112     @classmethod
 113     def href(cls, book):
 114         """ Returns an URI for a Book in the API. """
 115         return API_BASE + reverse("api_book", args=[book.slug])
 116
 117     @classmethod
 118     def url(cls, book):
 119         """ Returns Book's URL on the site. """
 120
 121         return WL_BASE + book.get_absolute_url()
 122
 123     @classmethod
 124     def children(cls, book):
 125         """ Returns all children for a book. """
 126
 127         return book.children.all()
 128
 129     @classmethod
 130     def media(cls, book):
 131         """ Returns all media for a book. """
 132         return book.media.all()
 133
 134     @classmethod
 135     def cover(cls, book):
 136         return MEDIA_BASE + book.cover.url if book.cover else ''
 137
 138     @classmethod
 139     def cover_thumb(cls, book):
 140         return MEDIA_BASE + default.backend.get_thumbnail(
 141                     book.cover, "139x193").url if book.cover else ''
 142
 143
 144
 145 class BookDetailHandler(BaseHandler, BookDetails):
 146     """ Main handler for Book objects.
 147
 148     Responsible for single Book details.
 149     """
 150     allowed_methods = ['GET']
 151     fields = ['title', 'parent', 'children'] + Book.formats + [
 152         'media', 'url', 'cover', 'cover_thumb'] + [
 153             category_plural[c] for c in book_tag_categories]
 154
 155     @piwik_track
 156     def read(self, request, book):
 157         """ Returns details of a book, identified by a slug and lang. """
 158         try:
 159             return Book.objects.get(slug=book)
 160         except Book.DoesNotExist:
 161             return rc.NOT_FOUND
 162
 163
 164 class AnonymousBooksHandler(AnonymousBaseHandler, BookDetails):
 165     """ Main handler for Book objects.
 166
 167     Responsible for lists of Book objects.
 168     """
 169     allowed_methods = ('GET',)
 170     model = Book
 171     fields = ['author', 'href', 'title', 'url', 'cover']
 172
 173     @piwik_track
 174     def read(self, request, tags, top_level=False,
 175                 audiobooks=False, daisy=False):
 176         """ Lists all books with given tags.
 177
 178         :param tags: filtering tags; should be a path of categories
 179              and slugs, i.e.: authors/an-author/epoch/an-epoch/
 180         :param top_level: if True and a book is included in the results,
 181              it's children are aren't. By default all books matching the tags
 182              are returned.
 183         """
 184         try:
 185             tags = read_tags(tags, allowed=book_tag_categories)
 186         except ValueError:
 187             return rc.NOT_FOUND
 188
 189         if tags:
 190             if top_level:
 191                 books = Book.tagged_top_level(tags)
 192                 return books if books else rc.NOT_FOUND
 193             else:
 194                 books = Book.tagged.with_all(tags)
 195         else:
 196             books = Book.objects.all()
 197
 198         if top_level:
 199             books = books.filter(parent=None)
 200         if audiobooks:
 201             books = books.filter(media__type='mp3').distinct()
 202         if daisy:
 203             books = books.filter(media__type='daisy').distinct()
 204
 205         if books.exists():
 206             return books
 207         else:
 208             return rc.NOT_FOUND
 209
 210     def create(self, request, *args, **kwargs):
 211         return rc.FORBIDDEN
 212
 213
 214 class BooksHandler(BookDetailHandler):
 215     allowed_methods = ('GET', 'POST')
 216     model = Book
 217     fields = ['author', 'href', 'title', 'url']
 218     anonymous = AnonymousBooksHandler
 219
 220     def create(self, request, *args, **kwargs):
 221         if not request.user.has_perm('catalogue.add_book'):
 222             return rc.FORBIDDEN
 223
 224         data = json.loads(request.POST.get('data'))
 225         form = BookImportForm(data)
 226         if form.is_valid():
 227             form.save()
 228             return rc.CREATED
 229         else:
 230             return rc.NOT_FOUND
 231
 232
 233 class EBooksHandler(AnonymousBooksHandler):
 234     fields = ('author', 'href', 'title', 'cover') + tuple(Book.ebook_formats)
 235
 236
 237 # add categorized tags fields for Book
 238 def _tags_getter(category):
 239     @classmethod
 240     def get_tags(cls, book):
 241         return book.tags.filter(category=category)
 242     return get_tags
 243 for plural, singular in category_singular.items():
 244     setattr(BookDetails, plural, _tags_getter(singular))
 245
 246 # add fields for files in Book
 247 def _file_getter(format):
 248     field = "%s_file" % format
 249     @classmethod
 250     def get_file(cls, book):
 251         f = getattr(book, field)
 252         if f:
 253             return MEDIA_BASE + f.url
 254         else:
 255             return ''
 256     return get_file
 257 for format in Book.formats:
 258     setattr(BookDetails, format, _file_getter(format))
 259
 260
 261 class TagDetails(object):
 262     """Custom Tag fields."""
 263
 264     @classmethod
 265     def href(cls, tag):
 266         """ Returns URI in the API for the tag. """
 267
 268         return API_BASE + reverse("api_tag", args=[category_plural[tag.category], tag.slug])
 269
 270     @classmethod
 271     def url(cls, tag):
 272         """ Returns URL on the site. """
 273
 274         return WL_BASE + tag.get_absolute_url()
 275
 276
 277 class TagDetailHandler(BaseHandler, TagDetails):
 278     """ Responsible for details of a single Tag object. """
 279
 280     fields = ['name', 'url', 'sort_key', 'description']
 281
 282     @piwik_track
 283     def read(self, request, category, slug):
 284         """ Returns details of a tag, identified by category and slug. """
 285
 286         try:
 287             category_sng = category_singular[category]
 288         except KeyError, e:
 289             return rc.NOT_FOUND
 290
 291         try:
 292             return Tag.objects.get(category=category_sng, slug=slug)
 293         except Tag.DoesNotExist:
 294             return rc.NOT_FOUND
 295
 296
 297 class TagsHandler(BaseHandler, TagDetails):
 298     """ Main handler for Tag objects.
 299
 300     Responsible for lists of Tag objects
 301     and fields used for representing Tags.
 302
 303     """
 304     allowed_methods = ('GET',)
 305     model = Tag
 306     fields = ['name', 'href', 'url']
 307
 308     @piwik_track
 309     def read(self, request, category):
 310         """ Lists all tags in the category (eg. all themes). """
 311
 312         try:
 313             category_sng = category_singular[category]
 314         except KeyError, e:
 315             return rc.NOT_FOUND
 316
 317         tags = Tag.objects.filter(category=category_sng).exclude(book_count=0)
 318         if tags.exists():
 319             return tags
 320         else:
 321             return rc.NOT_FOUND
 322
 323
 324 class FragmentDetails(object):
 325     """Custom Fragment fields."""
 326
 327     @classmethod
 328     def href(cls, fragment):
 329         """ Returns URI in the API for the fragment. """
 330
 331         return API_BASE + reverse("api_fragment",
 332             args=[fragment.book.slug, fragment.anchor])
 333
 334     @classmethod
 335     def url(cls, fragment):
 336         """ Returns URL on the site for the fragment. """
 337
 338         return WL_BASE + fragment.get_absolute_url()
 339
 340     @classmethod
 341     def themes(cls, fragment):
 342         """ Returns a list of theme tags for the fragment. """
 343
 344         return fragment.tags.filter(category='theme')
 345
 346
 347 class FragmentDetailHandler(BaseHandler, FragmentDetails):
 348     fields = ['book', 'anchor', 'text', 'url', 'themes']
 349
 350     @piwik_track
 351     def read(self, request, book, anchor):
 352         """ Returns details of a fragment, identified by book slug and anchor. """
 353         try:
 354             return Fragment.objects.get(book__slug=book, anchor=anchor)
 355         except Fragment.DoesNotExist:
 356             return rc.NOT_FOUND
 357
 358
 359 class FragmentsHandler(BaseHandler, FragmentDetails):
 360     """ Main handler for Fragments.
 361
 362     Responsible for lists of Fragment objects
 363     and fields used for representing Fragments.
 364
 365     """
 366     model = Fragment
 367     fields = ['book', 'url', 'anchor', 'href']
 368     allowed_methods = ('GET',)
 369
 370     categories = set(['author', 'epoch', 'kind', 'genre', 'book', 'theme'])
 371
 372     @piwik_track
 373     def read(self, request, tags):
 374         """ Lists all fragments with given book, tags, themes.
 375
 376         :param tags: should be a path of categories and slugs, i.e.:
 377              books/book-slug/authors/an-author/themes/a-theme/
 378
 379         """
 380         try:
 381             tags = read_tags(tags, allowed=self.categories)
 382         except ValueError:
 383             return rc.NOT_FOUND
 384         fragments = Fragment.tagged.with_all(tags).select_related('book')
 385         if fragments.exists():
 386             return fragments
 387         else:
 388             return rc.NOT_FOUND
 389
 390
 391
 392 # Changes handlers
 393
 394 class CatalogueHandler(BaseHandler):
 395
 396     @staticmethod
 397     def fields(request, name):
 398         fields_str = request.GET.get(name) if request is not None else None
 399         return fields_str.split(',') if fields_str is not None else None
 400
 401     @staticmethod
 402     def until(t=None):
 403         """ Returns time suitable for use as upper time boundary for check.
 404
 405             Used to avoid issues with time between setting the change stamp
 406             and actually saving the model in database.
 407             Cuts the microsecond part to avoid issues with DBs where time has
 408             more precision.
 409
 410             :param datetime t: manually sets the upper boundary
 411
 412         """
 413         # set to five minutes ago, to avoid concurrency issues
 414         if t is None:
 415             t = datetime.now() - timedelta(seconds=settings.API_WAIT)
 416         # set to whole second in case DB supports something smaller
 417         return t.replace(microsecond=0)
 418
 419     @staticmethod
 420     def book_dict(book, fields=None):
 421         all_fields = ['url', 'title', 'description',
 422                       'gazeta_link', 'wiki_link',
 423                       ] + Book.formats + BookMedia.formats.keys() + [
 424                       'parent', 'parent_number',
 425                       'tags',
 426                       'license', 'license_description', 'source_name',
 427                       'technical_editors', 'editors',
 428                       'author', 'sort_key',
 429                      ]
 430         if fields:
 431             fields = (f for f in fields if f in all_fields)
 432         else:
 433             fields = all_fields
 434
 435         extra_info = book.extra_info
 436
 437         obj = {}
 438         for field in fields:
 439
 440             if field in Book.formats:
 441                 f = getattr(book, field+'_file')
 442                 if f:
 443                     obj[field] = {
 444                         'url': f.url,
 445                         'size': f.size,
 446                     }
 447
 448             elif field in BookMedia.formats:
 449                 media = []
 450                 for m in book.media.filter(type=field).iterator():
 451                     media.append({
 452                         'url': m.file.url,
 453                         'size': m.file.size,
 454                     })
 455                 if media:
 456                     obj[field] = media
 457
 458             elif field == 'url':
 459                 obj[field] = book.get_absolute_url()
 460
 461             elif field == 'tags':
 462                 obj[field] = [t.id for t in book.tags.exclude(category__in=('book', 'set')).iterator()]
 463
 464             elif field == 'author':
 465                 obj[field] = ", ".join(t.name for t in book.tags.filter(category='author').iterator())
 466
 467             elif field == 'parent':
 468                 obj[field] = book.parent_id
 469
 470             elif field in ('license', 'license_description', 'source_name',
 471                       'technical_editors', 'editors'):
 472                 f = extra_info.get(field)
 473                 if f:
 474                     obj[field] = f
 475
 476             else:
 477                 f = getattr(book, field)
 478                 if f:
 479                     obj[field] = f
 480
 481         obj['id'] = book.id
 482         return obj
 483
 484     @classmethod
 485     def book_changes(cls, request=None, since=0, until=None, fields=None):
 486         since = datetime.fromtimestamp(int(since))
 487         until = cls.until(until)
 488
 489         changes = {
 490             'time_checked': timestamp(until)
 491         }
 492
 493         if not fields:
 494             fields = cls.fields(request, 'book_fields')
 495
 496         added = []
 497         updated = []
 498         deleted = []
 499
 500         last_change = since
 501         for book in Book.objects.filter(changed_at__gte=since,
 502                     changed_at__lt=until).iterator():
 503             book_d = cls.book_dict(book, fields)
 504             updated.append(book_d)
 505         if updated:
 506             changes['updated'] = updated
 507
 508         for book in Deleted.objects.filter(content_type=Book,
 509                     deleted_at__gte=since,
 510                     deleted_at__lt=until,
 511                     created_at__lt=since).iterator():
 512             deleted.append(book.id)
 513         if deleted:
 514             changes['deleted'] = deleted
 515
 516         return changes
 517
 518     @staticmethod
 519     def tag_dict(tag, fields=None):
 520         all_fields = ('name', 'category', 'sort_key', 'description',
 521                       'gazeta_link', 'wiki_link',
 522                       'url', 'books',
 523                      )
 524
 525         if fields:
 526             fields = (f for f in fields if f in all_fields)
 527         else:
 528             fields = all_fields
 529
 530         obj = {}
 531         for field in fields:
 532
 533             if field == 'url':
 534                 obj[field] = tag.get_absolute_url()
 535
 536             elif field == 'books':
 537                 obj[field] = [b.id for b in Book.tagged_top_level([tag]).iterator()]
 538
 539             elif field == 'sort_key':
 540                 obj[field] = tag.sort_key
 541
 542             else:
 543                 f = getattr(tag, field)
 544                 if f:
 545                     obj[field] = f
 546
 547         obj['id'] = tag.id
 548         return obj
 549
 550     @classmethod
 551     def tag_changes(cls, request=None, since=0, until=None, fields=None, categories=None):
 552         since = datetime.fromtimestamp(int(since))
 553         until = cls.until(until)
 554
 555         changes = {
 556             'time_checked': timestamp(until)
 557         }
 558
 559         if not fields:
 560             fields = cls.fields(request, 'tag_fields')
 561         if not categories:
 562             categories = cls.fields(request, 'tag_categories')
 563
 564         all_categories = ('author', 'epoch', 'kind', 'genre')
 565         if categories:
 566             categories = (c for c in categories if c in all_categories)
 567         else:
 568             categories = all_categories
 569
 570         updated = []
 571         deleted = []
 572
 573         for tag in Tag.objects.filter(category__in=categories,
 574                     changed_at__gte=since,
 575                     changed_at__lt=until).iterator():
 576             # only serve non-empty tags
 577             if tag.book_count:
 578                 tag_d = cls.tag_dict(tag, fields)
 579                 updated.append(tag_d)
 580             elif tag.created_at < since:
 581                 deleted.append(tag.id)
 582         if updated:
 583             changes['updated'] = updated
 584
 585         for tag in Deleted.objects.filter(category__in=categories,
 586                 content_type=Tag,
 587                     deleted_at__gte=since,
 588                     deleted_at__lt=until,
 589                     created_at__lt=since).iterator():
 590             deleted.append(tag.id)
 591         if deleted:
 592             changes['deleted'] = deleted
 593
 594         return changes
 595
 596     @classmethod
 597     def changes(cls, request=None, since=0, until=None, book_fields=None,
 598                 tag_fields=None, tag_categories=None):
 599         until = cls.until(until)
 600         since = int(since)
 601
 602         if not since:
 603             cache = get_cache('api')
 604             key = hash((book_fields, tag_fields, tag_categories,
 605                     tuple(sorted(request.GET.items()))
 606                   ))
 607             value = cache.get(key)
 608             if value is not None:
 609                 return value
 610
 611         changes = {
 612             'time_checked': timestamp(until)
 613         }
 614
 615         changes_by_type = {
 616             'books': cls.book_changes(request, since, until, book_fields),
 617             'tags': cls.tag_changes(request, since, until, tag_fields, tag_categories),
 618         }
 619
 620         for model in changes_by_type:
 621             for field in changes_by_type[model]:
 622                 if field == 'time_checked':
 623                     continue
 624                 changes.setdefault(field, {})[model] = changes_by_type[model][field]
 625
 626         if not since:
 627             cache.set(key, changes)
 628
 629         return changes
 630
 631
 632 class BookChangesHandler(CatalogueHandler):
 633     allowed_methods = ('GET',)
 634
 635     @piwik_track
 636     def read(self, request, since):
 637         return self.book_changes(request, since)
 638
 639
 640 class TagChangesHandler(CatalogueHandler):
 641     allowed_methods = ('GET',)
 642
 643     @piwik_track
 644     def read(self, request, since):
 645         return self.tag_changes(request, since)
 646
 647
 648 class ChangesHandler(CatalogueHandler):
 649     allowed_methods = ('GET',)
 650
 651     @piwik_track
 652     def read(self, request, since):
 653         return self.changes(request, since)
 654
 655
 656 class PictureHandler(BaseHandler):
 657     model = Picture
 658     fields = ('slug', 'title')
 659     allowed_methods = ('POST',)
 660
 661     def create(self, request):
 662         if not request.user.has_perm('picture.add_picture'):
 663             return rc.FORBIDDEN
 664
 665         data = json.loads(request.POST.get('data'))
 666         form = PictureImportForm(data)
 667         if form.is_valid():
 668             form.save()
 669             return rc.CREATED
 670         else:
 671             return rc.NOT_FOUND