diff options
author | Denis Wernert <deniswernert@gmail.com> | 2018-10-08 14:56:20 +0200 |
---|---|---|
committer | Denis Wernert <deniswernert@gmail.com> | 2018-10-08 14:56:20 +0200 |
commit | b9ada93b3ade2b4268bdc898e2c67b156b4dba92 (patch) | |
tree | 7b0a9baf2af19d200a8dec804aa0d31c947057ee /searx/engines/unsplash.py | |
parent | ee07a5e75005deb5d846f404f350aefd96b11b2d (diff) | |
download | searxng-b9ada93b3ade2b4268bdc898e2c67b156b4dba92.tar.gz searxng-b9ada93b3ade2b4268bdc898e2c67b156b4dba92.zip |
Removes what looks like tracking parameters
Diffstat (limited to 'searx/engines/unsplash.py')
-rw-r--r-- | searx/engines/unsplash.py | 20 |
1 files changed, 16 insertions, 4 deletions
diff --git a/searx/engines/unsplash.py b/searx/engines/unsplash.py index 04a943297..2e8d6fdfc 100644 --- a/searx/engines/unsplash.py +++ b/searx/engines/unsplash.py @@ -10,7 +10,7 @@ @parse url, title, img_src, thumbnail_src """ -from searx.url_utils import urlencode +from searx.url_utils import urlencode, urlparse, urlunparse, parse_qsl from json import loads url = 'https://unsplash.com/' @@ -20,6 +20,18 @@ page_size = 20 paging = True +def clean_url(url): + parsed = urlparse(url) + query = [(k, v) for (k, v) in parse_qsl(parsed.query) if k not in ['ixid', 's']] + + return urlunparse((parsed.scheme, + parsed.netloc, + parsed.path, + parsed.params, + urlencode(query), + parsed.fragment)) + + def request(query, params): params['url'] = search_url + urlencode({'query': query, 'page': params['pageno'], 'per_page': page_size}) return params @@ -32,9 +44,9 @@ def response(resp): if 'results' in json_data: for result in json_data['results']: results.append({'template': 'images.html', - 'url': result['links']['html'], - 'thumbnail_src': result['urls']['thumb'], - 'img_src': result['urls']['raw'], + 'url': clean_url(result['links']['html']), + 'thumbnail_src': clean_url(result['urls']['thumb']), + 'img_src': clean_url(result['urls']['raw']), 'title': result['description'], 'content': ''}) return results |