X-Git-Url: https://git.mdrn.pl/redakcja.git/blobdiff_plain/0f84fb864cfe3f6c642706f40933ede6a74fe0c4..e08b9a9ce539493a925abad05a1a2900aa80583e:/apps/cover/forms.py?ds=sidebyside
diff --git a/apps/cover/forms.py b/apps/cover/forms.py
index e6ffdff4..e4c949c8 100755
--- a/apps/cover/forms.py
+++ b/apps/cover/forms.py
@@ -3,6 +3,7 @@
# This file is part of FNP-Redakcja, licensed under GNU Affero GPLv3 or later.
# Copyright © Fundacja Nowoczesna Polska. See NOTICE for more information.
#
+import json
import re
from urllib2 import urlopen
from django import forms
@@ -62,6 +63,7 @@ class FlickrForm(forms.Form):
def clean_source_url(self):
def normalize_html(html):
+ return html
return re.sub('[\t\n]', '', html)
url = self.cleaned_data['source_url']
@@ -75,7 +77,7 @@ class FlickrForm(forms.Form):
html = normalize_html(urlopen(url).read().decode('utf-8'))
except:
raise forms.ValidationError('Error reading page.')
- match = re.search(r'Some rights reserved', html)
+ match = re.search(r']* rel="license ', html)
try:
assert match
license_url = match.group(1)
@@ -87,22 +89,21 @@ class FlickrForm(forms.Form):
except AssertionError:
raise forms.ValidationError('Error reading license name.')
- m = re.search(r'"ownername":"([^"]*)', html)
+ m = re.search(r']* class="owner-name [^>]*>([^<]*)<', html)
if m:
self.cleaned_data['author'] = "%s@Flickr" % m.group(1)
else:
raise forms.ValidationError('Error reading author name.')
- m = re.search(r']*>(.*?)
', html)
+ m = re.search(r']*>(.*?)
', html, re.S)
if not m:
raise forms.ValidationError('Error reading image title.')
- self.cleaned_data['title'] = m.group(1)
+ self.cleaned_data['title'] = m.group(1).strip()
- url_size = base_url + "sizes/o/"
- html = normalize_html(urlopen(url_size).read().decode('utf-8'))
- m = re.search(r'\s*