summaryrefslogtreecommitdiff
path: root/searx/engines/unsplash.py
blob: dcca18ee6c0901e9b0106ab11667f4ff82a3e767 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
# SPDX-License-Identifier: AGPL-3.0-or-later
# lint: pylint
# pylint: disable=missing-function-docstring
"""Unsplash

"""

from urllib.parse import urlencode, urlparse, urlunparse, parse_qsl
from json import loads

# Engine metadata: where the data comes from and how it is accessed.
about = {
    'website': 'https://unsplash.com',
    'wikidata_id': 'Q28233552',
    'official_api_documentation': 'https://unsplash.com/developers',
    # Results are fetched without the official API and without an API key.
    'use_official_api': False,
    'require_api_key': False,
    'results': 'JSON',
}

# Engine configuration: result category and paging behaviour.
categories = ['images']
paging = True
page_size = 20  # sent as ``per_page`` with every search request

# Endpoints; ``search_url`` ends with '?' so an encoded query string can be
# appended directly.
base_url = 'https://unsplash.com/'
search_url = base_url + 'napi/search/photos?'


def clean_url(url):
    """Return *url* with the ``ixid`` and ``s`` query parameters removed.

    The query string is decoded with ``parse_qsl`` and re-encoded with
    ``urlencode``: the remaining parameters keep their relative order, but
    their escaping is normalised and parameters with blank values are
    dropped (``parse_qsl`` default).  The other URL components are reused
    exactly as ``urlparse`` returned them.
    """
    parts = urlparse(url)

    kept = []
    for name, value in parse_qsl(parts.query):
        if name in ('ixid', 's'):
            continue
        kept.append((name, value))

    # ParseResult is a 6-field named tuple, so swapping the query field and
    # handing it to urlunparse is the same as rebuilding the tuple by hand.
    return urlunparse(parts._replace(query=urlencode(kept)))


def request(query, params):
    """Store the Unsplash search URL for *query* in ``params['url']``.

    The URL is ``search_url`` followed by the url-encoded ``query``, the
    page number read from ``params['pageno']`` and ``page_size`` (sent as
    ``per_page``).  *params* is modified in place and also returned.

    NOTE(review): ``logger`` is not defined in this file; presumably the
    engine loader injects it into the module -- confirm.
    """
    query_args = {
        'query': query,
        'page': params['pageno'],
        'per_page': page_size,
    }
    params['url'] = search_url + urlencode(query_args)
    logger.debug("query_url --> %s", params['url'])
    return params


def response(resp):
    """Convert the JSON body in ``resp.text`` into a list of image results.

    Returns one dict per entry of the payload's ``results`` list, or an
    empty list when the payload has no ``results`` key.  Each dict uses the
    ``images.html`` template; its page, thumbnail and raw image URLs are
    passed through ``clean_url``.  ``title`` falls back to ``'unknown'``
    and ``content`` to ``''`` when the corresponding field is missing or
    empty.
    """
    payload = loads(resp.text)

    if 'results' not in payload:
        return []

    return [
        {
            'template': 'images.html',
            'url': clean_url(photo['links']['html']),
            'thumbnail_src': clean_url(photo['urls']['thumb']),
            'img_src': clean_url(photo['urls']['raw']),
            'title': photo.get('alt_description') or 'unknown',
            'content': photo.get('description') or '',
        }
        for photo in payload['results']
    ]