diff options
author | Noémi Ványi <sitbackandwait@gmail.com> | 2021-03-13 20:27:47 +0100 |
---|---|---|
committer | Noémi Ványi <sitbackandwait@gmail.com> | 2021-03-13 21:18:09 +0100 |
commit | ff527e268170852563830bf5b29a65515a98d2bb (patch) | |
tree | 224dcdd2baab7e640eb3c5c76ee7dc21dcbc16ba /searx/engines | |
parent | 9292571304376c2c463fb26ee0db89298bb00e6c (diff) | |
download | searxng-ff527e268170852563830bf5b29a65515a98d2bb.tar.gz searxng-ff527e268170852563830bf5b29a65515a98d2bb.zip |
Add Solr engine
Diffstat (limited to 'searx/engines')
-rw-r--r-- | searx/engines/solr.py | 74 |
1 files changed, 74 insertions, 0 deletions
diff --git a/searx/engines/solr.py b/searx/engines/solr.py new file mode 100644 index 000000000..0bfcbab36 --- /dev/null +++ b/searx/engines/solr.py @@ -0,0 +1,74 @@ +# SPDX-License-Identifier: AGPL-3.0-or-later +""" + Solr +""" + +# pylint: disable=global-statement, missing-function-docstring + +from json import loads +from urllib.parse import urlencode +from searx.exceptions import SearxEngineAPIException + + +base_url = 'http://localhost:8983' +collection = '' +rows = 10 +sort = '' # sorting: asc or desc +field_list = 'name' # list of field names to display on the UI +default_fields = '' # default field to query +query_fields = '' # query fields +_search_url = '' +paging = True + + +def init(_): + if collection == '': + raise ValueError('collection cannot be empty') + + global _search_url + _search_url = base_url + '/solr/' + collection + '/select?{params}' + + +def request(query, params): + query_params = {'q': query, 'rows': rows} + if field_list != '': + query_params['fl'] = field_list + if query_fields != '': + query_params['qf'] = query_fields + if default_fields != '': + query_params['df'] = default_fields + if sort != '': + query_params['sort'] = sort + + if 'pageno' in params: + query_params['start'] = rows * (params['pageno'] - 1) + + params['url'] = _search_url.format(params=urlencode(query_params)) + + return params + + +def response(resp): + resp_json = __get_response(resp) + + results = [] + for result in resp_json['response']['docs']: + r = {key: str(value) for key, value in result.items()} + if len(r) == 0: + continue + r['template'] = 'key-value.html' + results.append(r) + + return results + + +def __get_response(resp): + try: + resp_json = loads(resp.text) + except Exception as e: + raise SearxEngineAPIException("failed to parse response") from e + + if 'error' in resp_json: + raise SearxEngineAPIException(resp_json['error']['msg']) + + return resp_json |