forked from citizen-cyberscience-centre/app-categorize
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathget_images.py
61 lines (55 loc) · 2.15 KB
/
get_images.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
# -*- coding: utf-8 -*-
# This file is part of PyBOSSA.
#
# PyBOSSA is free software: you can redistribute it and/or modify
# it under the terms of the GNU Affero General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# PyBOSSA is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU Affero General Public License for more details.
#
# You should have received a copy of the GNU Affero General Public License
# along with PyBOSSA. If not, see <http://www.gnu.org/licenses/>.
import urllib
import urllib2
import re
import json
import string
def get_flickr_photos(size="big"):
    """
    Gets public photos from the Flickr public photos feed.

    Downloads the ``photos_public`` feed as JSON, repairs the invalid
    backslash escapes found in the response and builds one record per
    feed item.

    :arg string size: Kept for backward compatibility. The value is
        currently not used: every record always carries both the medium
        and the big image URL.
    :returns: A list of dicts, one per feed item, with the keys ``link``
        (the item's ``link`` value, i.e. the Flickr page hosting the
        photo), ``url_m`` (the item's ``media.m`` URL) and ``url_b``
        (``url_m`` with ``_m.jpg`` replaced by ``_b.jpg``).
    :rtype: list
    """
    # Add 'ids': '25053835@N03' to the values dict if you want to
    # restrict the feed to a specific Flickr Person ID.
    print('Contacting Flickr for photos')
    url = "http://api.flickr.com/services/feeds/photos_public.gne"
    values = {'nojsoncallback': 1,
              'format': "json"}
    query = url + "?" + urllib.urlencode(values)

    # urllib2 responses are not context managers, so close the connection
    # explicitly, also when read() fails half way through.
    urlobj = urllib2.urlopen(query)
    try:
        data = urlobj.read()
    finally:
        urlobj.close()

    # The JSON returned by Flickr is not correctly escaped (see
    # http://goo.gl/A9VNo): double every backslash that is not followed
    # by '/', 'u' or '"' so that json.loads accepts the document.
    regex = re.compile(r'\\(?![/u"])')
    fixed = regex.sub(r"\\\\", data)
    output = json.loads(fixed)
    print('Data retrieved from Flickr')

    # The feed only provides the medium ("_m") image URL; the big one is
    # derived from it by swapping the size suffix. A URL that does not
    # contain "_m.jpg" is left unchanged.
    photos = []
    for idx, photo in enumerate(output['items']):
        print('Retrieved photo: %s' % idx)
        img_url_m = photo["media"]["m"]
        img_url_b = img_url_m.replace("_m.jpg", "_b.jpg")
        photos.append({'link': photo["link"],
                       'url_m': img_url_m,
                       'url_b': img_url_b})
    return photos