+ # Extract fragments
+ closed_fragments, open_fragments = html.extract_fragments(book.html_file.path)
+ book_themes = []
+ for fragment in closed_fragments.values():
+ text = fragment.to_string()
+ short_text = ''
+ if (len(MarkupString(text)) > 240):
+ short_text = MarkupString(text)[:160]
+ new_fragment = Fragment(text=text, short_text=short_text, anchor=fragment.id, book=book)
+
+ theme_names = [s.strip() for s in fragment.themes.split(',')]
+ themes = []
+ for theme_name in theme_names:
+ tag, created = Tag.objects.get_or_create(name=theme_name,
+ slug=slughifi(theme_name), sort_key=slughifi(theme_name), category='theme')
+ tag.save()
+ themes.append(tag)
+ new_fragment.save()
+ new_fragment.tags = list(book.tags) + themes
+ book_themes += themes
+
+ book_themes = set(book_themes)
+ book.tags = list(book.tags) + list(book_themes)