summaryrefslogtreecommitdiff
path: root/searx/engines/bpb.py
diff options
context:
space:
mode:
authorBnyro <bnyro@tutanota.com>2023-10-05 17:37:59 +0200
committerMarkus Heiser <markus.heiser@darmarIT.de>2023-11-27 16:46:41 +0100
commitbf75a8c2a0151faf258c0cc5f2210f42d7fe6e1f (patch)
tree26a75da1484b7e14029cf062c9b276e6cf52e15d /searx/engines/bpb.py
parent04cfce2eb845c0dfc7d578a6fb3c44cb546b2028 (diff)
downloadsearxng-bf75a8c2a0151faf258c0cc5f2210f42d7fe6e1f.tar.gz
searxng-bf75a8c2a0151faf258c0cc5f2210f42d7fe6e1f.zip
[feat] engine: implementation of bpb
Diffstat (limited to 'searx/engines/bpb.py')
-rw-r--r--searx/engines/bpb.py68
1 files changed, 68 insertions, 0 deletions
diff --git a/searx/engines/bpb.py b/searx/engines/bpb.py
new file mode 100644
index 000000000..5d6359aae
--- /dev/null
+++ b/searx/engines/bpb.py
@@ -0,0 +1,68 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
+# lint: pylint
+"""BPB refers to ``Bundeszentrale für poltische Bildung``, which is a German
+governmental institution aiming to reduce misinformation by providing resources
+about politics and history.
+"""
+
+from datetime import datetime
+from urllib.parse import urlencode
+
+about = {
+ 'website': "https://www.bpb.de",
+ 'official_api_documentation': None,
+ 'use_official_api': False,
+ 'require_api_key': False,
+ 'results': 'JSON',
+ 'language': 'de',
+}
+
+paging = True
+categories = ['general']
+
+
+base_url = "https://www.bpb.de"
+
+
+def request(query, params):
+ args = {
+ 'query[term]': query,
+ 'page': params['pageno'] - 1,
+ 'sort[direction]': 'descending',
+ 'payload[nid]': 65350,
+ }
+ params['url'] = f"{base_url}/bpbapi/filter/search?{urlencode(args)}"
+ return params
+
+
+def response(resp):
+ results = []
+
+ json_resp = resp.json()
+
+ for result in json_resp['teaser']:
+ img_src = None
+ if result['teaser']['image']:
+ img_src = base_url + result['teaser']['image']['sources'][-1]['url']
+
+ metadata = result['extension']['overline']
+ authors = ', '.join(author['name'] for author in result['extension'].get('authors', []))
+ if authors:
+ metadata += f" | {authors}"
+
+ publishedDate = None
+ if result['extension'].get('publishingDate'):
+ publishedDate = datetime.utcfromtimestamp(result['extension']['publishingDate'])
+
+ results.append(
+ {
+ 'url': base_url + result['teaser']['link']['url'],
+ 'title': result['teaser']['title'],
+ 'content': result['teaser']['text'],
+ 'img_src': img_src,
+ 'publishedDate': publishedDate,
+ 'metadata': metadata,
+ }
+ )
+
+ return results