diff options
author | Adam Tauber <asciimoo@gmail.com> | 2021-03-15 15:39:39 +0100 |
---|---|---|
committer | GitHub <noreply@github.com> | 2021-03-15 15:39:39 +0100 |
commit | dd34ac396cca75ff7b1690b00161d6c7253f46d0 (patch) | |
tree | f272a0367e4e70f75b2f2216fa1c722874548538 /searx | |
parent | 1664258061f9e718320852339cf0bd6d3324a83e (diff) | |
parent | ff527e268170852563830bf5b29a65515a98d2bb (diff) | |
download | searxng-dd34ac396cca75ff7b1690b00161d6c7253f46d0.tar.gz searxng-dd34ac396cca75ff7b1690b00161d6c7253f46d0.zip |
Merge pull request #2652 from kvch/solr-engine
Add Apache Solr engine
Diffstat (limited to 'searx')
-rw-r--r-- | searx/engines/solr.py | 74 | ||||
-rw-r--r-- | searx/settings.yml | 11 |
2 files changed, 85 insertions, 0 deletions
diff --git a/searx/engines/solr.py b/searx/engines/solr.py new file mode 100644 index 000000000..0bfcbab36 --- /dev/null +++ b/searx/engines/solr.py @@ -0,0 +1,74 @@ +# SPDX-License-Identifier: AGPL-3.0-or-later +""" + Solr +""" + +# pylint: disable=global-statement, missing-function-docstring + +from json import loads +from urllib.parse import urlencode +from searx.exceptions import SearxEngineAPIException + + +base_url = 'http://localhost:8983' +collection = '' +rows = 10 +sort = '' # sorting: asc or desc +field_list = 'name' # list of field names to display on the UI +default_fields = '' # default field to query +query_fields = '' # query fields +_search_url = '' +paging = True + + +def init(_): + if collection == '': + raise ValueError('collection cannot be empty') + + global _search_url + _search_url = base_url + '/solr/' + collection + '/select?{params}' + + +def request(query, params): + query_params = {'q': query, 'rows': rows} + if field_list != '': + query_params['fl'] = field_list + if query_fields != '': + query_params['qf'] = query_fields + if default_fields != '': + query_params['df'] = default_fields + if sort != '': + query_params['sort'] = sort + + if 'pageno' in params: + query_params['start'] = rows * (params['pageno'] - 1) + + params['url'] = _search_url.format(params=urlencode(query_params)) + + return params + + +def response(resp): + resp_json = __get_response(resp) + + results = [] + for result in resp_json['response']['docs']: + r = {key: str(value) for key, value in result.items()} + if len(r) == 0: + continue + r['template'] = 'key-value.html' + results.append(r) + + return results + + +def __get_response(resp): + try: + resp_json = loads(resp.text) + except Exception as e: + raise SearxEngineAPIException("failed to parse response") from e + + if 'error' in resp_json: + raise SearxEngineAPIException(resp_json['error']['msg']) + + return resp_json diff --git a/searx/settings.yml b/searx/settings.yml index 3447777aa..a8d625b05 100644 --- a/searx/settings.yml +++ b/searx/settings.yml @@ -942,6 +942,17 @@ engines: # api_client_id : ******* # api_client_secret : ******* +# - name : solr +# engine : solr +# shortcut : slr +# base_url : http://localhost:8983 +# collection : collection_name +# sort : '' # sorting: asc or desc +# field_list : '' # comma separated list of field names to display on the UI +# default_fields : '' # default field to query +# query_fields : '' # query fields +# enable_http : True + - name : startpage engine : startpage shortcut : sp |