Made short text fragment text shorter.
[wolnelektury.git] / catalogue / models.py
1 # -*- coding: utf-8 -*-
2 from django.db import models
3 from django.db.models import permalink, Q
4 from django.utils.translation import ugettext_lazy as _
5 from django.contrib.auth.models import User
6 from django.core.files import File
7 from django.template.loader import render_to_string
8 from django.utils.safestring import mark_safe
9
10 from newtagging.models import TagBase
11 from newtagging import managers
12
13 from librarian import html
14
15
16 TAG_CATEGORIES = (
17     ('author', _('author')),
18     ('epoch', _('epoch')),
19     ('kind', _('kind')),
20     ('genre', _('genre')),
21     ('theme', _('theme')),
22     ('set', _('set')),
23 )
24
25
26 class TagSubcategoryManager(models.Manager):
27     def __init__(self, subcategory):
28         super(TagSubcategoryManager, self).__init__()
29         self.subcategory = subcategory
30         
31     def get_query_set(self):
32         return super(TagSubcategoryManager, self).get_query_set().filter(category=self.subcategory)
33
34
35 class Tag(TagBase):
36     name = models.CharField(_('name'), max_length=50, unique=True, db_index=True)
37     slug = models.SlugField(_('slug'), unique=True, db_index=True)
38     sort_key = models.SlugField(_('sort key'), db_index=True)
39     category = models.CharField(_('category'), max_length=50, blank=False, null=False, 
40         db_index=True, choices=TAG_CATEGORIES)
41     description = models.TextField(blank=True)
42     
43     user = models.ForeignKey(User, blank=True, null=True)
44     
45     def has_description(self):
46         return len(self.description) > 0
47     has_description.short_description = _('description')
48     has_description.boolean = True
49
50     @permalink
51     def get_absolute_url(self):
52         return ('catalogue.views.tagged_book_list', [self.slug])
53     
54     class Meta:
55         ordering = ('sort_key',)
56         verbose_name = _('tag')
57         verbose_name_plural = _('tags')
58     
59     def __unicode__(self):
60         return self.name
61
62     @staticmethod
63     def get_tag_list(tags):
64         if isinstance(tags, basestring):
65             tag_slugs = tags.split('/')
66             return [Tag.objects.get(slug=slug) for slug in tag_slugs]
67         else:
68             return TagBase.get_tag_list(tags)
69
70
71 class Book(models.Model):
72     title = models.CharField(_('title'), max_length=120)
73     slug = models.SlugField(_('slug'), unique=True, db_index=True)
74     description = models.TextField(_('description'), blank=True)
75     created_at = models.DateTimeField(_('creation date'), auto_now=True)
76     _short_html = models.TextField(_('short HTML'), editable=False)
77     
78     # Formats
79     xml_file = models.FileField(_('XML file'), upload_to='books/xml', blank=True)
80     pdf_file = models.FileField(_('PDF file'), upload_to='books/pdf', blank=True)
81     odt_file = models.FileField(_('ODT file'), upload_to='books/odt', blank=True)
82     html_file = models.FileField(_('HTML file'), upload_to='books/html', blank=True)
83     
84     objects = managers.ModelTaggedItemManager(Tag)
85     tags = managers.TagDescriptor(Tag)
86     
87     def short_html(self):
88         if len(self._short_html):
89             return mark_safe(self._short_html)
90         else:
91             tags = self.tags.filter(~Q(category__in=('set', 'theme')))
92             tags = [u'<a href="%s">%s</a>' % (tag.get_absolute_url(), tag.name) for tag in tags]
93
94             formats = []
95             if self.html_file:
96                 formats.append(u'<a href="%s">Czytaj online</a>' % self.html_file.url)
97             if self.pdf_file:
98                 formats.append(u'<a href="%s">Plik PDF</a>' % self.pdf_file.url)
99             if self.odt_file:
100                 formats.append(u'<a href="%s">Plik ODT</a>' % self.odt_file.url)
101             
102             self._short_html = render_to_string('catalogue/book_short.html',
103                 {'book': self, 'tags': tags, 'formats': formats})
104             self.save()
105             return mark_safe(self._short_html)
106     
107     def has_description(self):
108         return len(self.description) > 0
109     has_description.short_description = _('description')
110     has_description.boolean = True
111     
112     def has_pdf_file(self):
113         return bool(self.pdf_file)
114     has_pdf_file.short_description = 'PDF'
115     has_pdf_file.boolean = True
116     
117     def has_odt_file(self):
118         return bool(self.odt_file)
119     has_odt_file.short_description = 'ODT'
120     has_odt_file.boolean = True
121     
122     def has_html_file(self):
123         return bool(self.html_file)
124     has_html_file.short_description = 'HTML'
125     has_html_file.boolean = True
126
127     @staticmethod
128     def from_xml_file(xml_file):
129         from tempfile import NamedTemporaryFile
130         from slughifi import slughifi
131         import dcparser
132         from markupstring import MarkupString
133         import re
134         
135         # Read book metadata
136         book_info = dcparser.parse(xml_file)
137         book = Book(title=book_info.title, slug=slughifi(book_info.title))
138         book.save()
139         
140         book_tags = []
141         for category in ('kind', 'genre', 'author', 'epoch'):    
142             tag_name = getattr(book_info, category)
143             tag_sort_key = tag_name
144             if category == 'author':
145                 tag_sort_key = tag_name.last_name
146                 tag_name = ' '.join(tag_name.first_names) + ' ' + tag_name.last_name
147             tag, created = Tag.objects.get_or_create(name=tag_name,
148                 slug=slughifi(tag_name), sort_key=slughifi(tag_sort_key), category=category)
149             tag.save()
150             book_tags.append(tag)
151         book.tags = book_tags
152         
153         # Save XML and HTML files
154         book.xml_file.save('%s.xml' % book.slug, File(file(xml_file)), save=False)
155         
156         html_file = NamedTemporaryFile()
157         html.transform(book.xml_file.path, html_file)
158         book.html_file.save('%s.html' % book.slug, File(html_file), save=False)
159         
160         # Extract fragments
161         closed_fragments, open_fragments = html.extract_fragments(book.html_file.path)
162         book_themes = []
163         for fragment in closed_fragments.values():
164             text = fragment.to_string()
165             short_text = ''
166             if (len(re.sub(r'</?.*?>', '', text)) > 240):
167                 short_text = MarkupString(text)[:160]
168             new_fragment = Fragment(text=text, short_text=short_text, anchor=fragment.id, book=book)
169                 
170             theme_names = [s.strip() for s in fragment.themes.split(',')]
171             themes = []
172             for theme_name in theme_names:
173                 tag, created = Tag.objects.get_or_create(name=theme_name,
174                     slug=slughifi(theme_name), sort_key=slughifi(theme_name), category='theme')
175                 tag.save()
176                 themes.append(tag)
177             new_fragment.save()
178             new_fragment.tags = list(book.tags) + themes
179             book_themes += themes
180         
181         book_themes = set(book_themes)
182         book.tags = list(book.tags) + list(book_themes)
183         return book.save()
184     
185     @permalink
186     def get_absolute_url(self):
187         return ('catalogue.views.book_detail', [self.slug])
188         
189     class Meta:
190         ordering = ('title',)
191         verbose_name = _('book')
192         verbose_name_plural = _('books')
193
194     def __unicode__(self):
195         return self.title
196
197
198 class Fragment(models.Model):
199     text = models.TextField()
200     short_text = models.TextField(editable=False)
201     _short_html = models.TextField(editable=False)
202     anchor = models.IntegerField()
203     book = models.ForeignKey(Book, related_name='fragments')
204
205     objects = managers.ModelTaggedItemManager(Tag)
206     tags = managers.TagDescriptor(Tag)
207     
208     def short_html(self):
209         if len(self._short_html):
210             return mark_safe(self._short_html)
211         else:
212             book_authors = [u'<a href="%s">%s</a>' % (tag.get_absolute_url(), tag.name) 
213                 for tag in self.book.tags if tag.category == 'author']
214             
215             self._short_html = render_to_string('catalogue/fragment_short.html',
216                 {'fragment': self, 'book': self.book, 'book_authors': book_authors})
217             self.save()
218             return mark_safe(self._short_html)
219         
220     class Meta:
221         ordering = ('book', 'anchor',)
222         verbose_name = _('fragment')
223         verbose_name_plural = _('fragments')
224