+++ /dev/null
-# -*- coding: utf-8 -*-
-# This file is part of Wolnelektury, licensed under GNU Affero GPLv3 or later.
-# Copyright © Fundacja Nowoczesna Polska. See NOTICE for more information.
-#
-import cPickle
-from datetime import datetime
-from random import randint
-from StringIO import StringIO
-
-from django.core.files.base import ContentFile
-from django.db import models
-from django.db.models import permalink
-from django.utils.translation import ugettext_lazy as _
-from django.core.urlresolvers import reverse
-from django.db.models.signals import m2m_changed
-from django.contrib.auth.models import User
-from django.contrib.contenttypes.models import ContentType
-from django.contrib.contenttypes import generic
-from django.conf import settings
-
-from librarian import text
-from catalogue.fields import JSONField
-from catalogue.models import Book, Tag
-
-
-class Poem(models.Model):
- slug = models.SlugField(_('slug'), max_length=120, db_index=True)
- text = models.TextField(_('text'))
- created_by = models.ForeignKey(User, null=True)
- created_from = JSONField(_('extra information'), null=True, blank=True)
- created_at = models.DateTimeField(_('creation date'), auto_now_add=True, editable=False)
- seen_at = models.DateTimeField(_('last view date'), auto_now_add=True, editable=False)
- view_count = models.IntegerField(_('view count'), default=1)
-
- try:
- f = open(settings.LESMIANATOR_PICKLE)
- global_dictionary = cPickle.load(f)
- f.close()
- except:
- global_dictionary = {}
-
- def visit(self):
- self.view_count += 1
- self.seen_at = datetime.now()
- self.save()
-
- def __unicode__(self):
- return "%s (%s...)" % (self.slug, self.text[:20])
-
- @classmethod
- def write(cls, continuations=None, length=3, maxlen=1000):
- def choose_word(word, continuations):
- try:
- choices = sum((continuations[word][post] for post in continuations[word]))
- r = randint(0, choices - 1)
-
- for post in continuations[word]:
- r -= continuations[word][post]
- if r < 0:
- return post
- except KeyError:
- return ''
-
-
- if continuations is None:
- continuations = cls.global_dictionary
-
- letters = []
- word = u''
- empty = -10
- lines = 0
- if not continuations:
- maxlen = 0
- # want at least two lines, but let Lesmianator end his stanzas
- while (empty < 2 or lines < 2) and maxlen:
- letter = choose_word(word, continuations)
- letters.append(letter)
- word = word[-length+1:] + letter
- if letter == u'\n':
- # count non-empty lines
- if empty == 0:
- lines += 1
- #
- if lines >= 2:
- empty += 1
- lines += 1
- else:
- empty = 0
- maxlen -= 1
-
- return ''.join(letters).strip()
-
- def get_absolute_url(self):
- return reverse('get_poem', kwargs={'poem': self.slug})
-
-
-class Continuations(models.Model):
- pickle = models.FileField(_('Continuations file'), upload_to='lesmianator')
- content_type = models.ForeignKey(ContentType)
- object_id = models.PositiveIntegerField()
- content_object = generic.GenericForeignKey('content_type', 'object_id')
-
- class Meta:
- unique_together = (('content_type', 'object_id'), )
-
- def __unicode__(self):
- return "Continuations for: %s" % unicode(self.content_object)
-
- @staticmethod
- def join_conts(a, b):
- for pre in b:
- a.setdefault(pre, {})
- for post in b[pre]:
- a[pre].setdefault(post, 0)
- a[pre][post] += b[pre][post]
- return a
-
- @classmethod
- def for_book(cls, book, length=3):
- # count from this book only
- output = StringIO()
- f = open(book.xml_file.path)
- text.transform(f, output, False, ('raw-text',))
- f.close()
- conts = {}
- last_word = ''
- for letter in output.getvalue().decode('utf-8').strip().lower():
- mydict = conts.setdefault(last_word, {})
- mydict.setdefault(letter, 0)
- mydict[letter] += 1
- last_word = last_word[-length+1:] + letter
- # add children
- return reduce(cls.join_conts,
- (cls.get(child) for child in book.children.all()),
- conts)
-
- @classmethod
- def for_set(cls, tag):
- # book contains its descendants, we don't want them twice
- books = Book.tagged.with_any((tag,))
- l_tags = Tag.objects.filter(category='book', slug__in=[book.book_tag_slug() for book in books])
- descendants_keys = [book.pk for book in Book.tagged.with_any(l_tags)]
- if descendants_keys:
- books = books.exclude(pk__in=descendants_keys)
-
- cont_tabs = (cls.get(b) for b in books)
- return reduce(cls.join_conts, cont_tabs)
-
- @classmethod
- def get(cls, sth):
- object_type = ContentType.objects.get_for_model(sth)
- should_keys = set([sth.id])
- if isinstance(sth, Tag):
- should_keys = set(b.pk for b in Book.tagged.with_any((sth,)))
- try:
- obj = cls.objects.get(content_type=object_type, object_id=sth.id)
- if not obj.pickle:
- raise cls.DoesNotExist
- f = open(obj.pickle.path)
- keys, conts = cPickle.load(f)
- f.close()
- if set(keys) != should_keys:
- raise cls.DoesNotExist
- return conts
- except cls.DoesNotExist:
- if isinstance(sth, Book):
- conts = cls.for_book(sth)
- elif isinstance(sth, Tag):
- conts = cls.for_set(sth)
- else:
- raise NotImplemented('Lesmianator continuations: only Book and Tag supported')
-
- c, created = cls.objects.get_or_create(content_type=object_type, object_id=sth.id)
- c.pickle.save(sth.slug+'.p', ContentFile(cPickle.dumps((should_keys, conts))))
- c.save()
- return conts
-
-