diff options
author | Alexandre Flament <alex@al-f.net> | 2021-09-10 12:43:33 +0200 |
---|---|---|
committer | Alexandre Flament <alex@al-f.net> | 2021-09-11 13:23:06 +0200 |
commit | 0f43b39eac44d548143b3944a2bfa26c039b2068 (patch) | |
tree | b3791fd2e6efdea7e05e128b7a0f6bb1a237dff0 /searx | |
parent | b671e0364fbfb09701fb675ba23a7d7bebbcf744 (diff) | |
download | searxng-0f43b39eac44d548143b3944a2bfa26c039b2068.tar.gz searxng-0f43b39eac44d548143b3944a2bfa26c039b2068.zip |
[enh] add hostname_replace plugin
* backport of https://github.com/searx/searx/pull/2724
* allow removing a result when its replacement is the boolean value false
Diffstat (limited to 'searx')
-rw-r--r-- | searx/plugins/__init__.py | 2 | ||||
-rw-r--r-- | searx/plugins/hostname_replace.py | 32 | ||||
-rw-r--r-- | searx/settings.yml | 12 |
3 files changed, 45 insertions, 1 deletion
diff --git a/searx/plugins/__init__.py b/searx/plugins/__init__.py index 3a35f7025..1153c9ed1 100644 --- a/searx/plugins/__init__.py +++ b/searx/plugins/__init__.py @@ -31,6 +31,7 @@ from searx.plugins import (oa_doi_rewrite, hash_plugin, infinite_scroll, self_info, + hostname_replace, search_on_category_select, tracker_url_remover, vim_hotkeys) @@ -182,6 +183,7 @@ plugins.register(oa_doi_rewrite) plugins.register(hash_plugin) plugins.register(infinite_scroll) plugins.register(self_info) +plugins.register(hostname_replace) plugins.register(search_on_category_select) plugins.register(tracker_url_remover) plugins.register(vim_hotkeys) diff --git a/searx/plugins/hostname_replace.py b/searx/plugins/hostname_replace.py new file mode 100644 index 000000000..778b84615 --- /dev/null +++ b/searx/plugins/hostname_replace.py @@ -0,0 +1,32 @@ +# SPDX-License-Identifier: AGPL-3.0-or-later + +import re +from urllib.parse import urlunparse +from searx import settings +from searx.plugins import logger +from flask_babel import gettext + +name = gettext('Hostname replace') +description = gettext('Rewrite result hostnames or remove results based on the hostname') +default_on = False +preference_section = 'general' + +plugin_id = 'hostname_replace' + +replacements = {re.compile(p): r for (p, r) in settings[plugin_id].items()} if plugin_id in settings else {} + +logger = logger.getChild(plugin_id) +parsed = 'parsed_url' + + +def on_result(request, search, result): + if parsed not in result: + return True + for (pattern, replacement) in replacements.items(): + if pattern.search(result[parsed].netloc): + if not replacement: + return False + result[parsed] = result[parsed]._replace(netloc=pattern.sub(replacement, result[parsed].netloc)) + result['url'] = urlunparse(result[parsed]) + + return True diff --git a/searx/settings.yml b/searx/settings.yml index e5eb9dd65..8e2aeb5e9 100644 --- a/searx/settings.yml +++ b/searx/settings.yml @@ -150,7 +150,17 @@ outgoing: # # enabled_plugins: # - 
"HTTPS rewrite" -# - ... +# - "Hostname replace" # see configuration below + +# "Hostname replace" plugin configuration example: +# hostname_replace: +# '(.*\.)?youtube\.com$': 'invidious.example.com' +# '(.*\.)?youtu\.be$': 'invidious.example.com' +# '(.*\.)?youtube-nocookie\.com$': 'yotter.example.com' +# '(.*\.)?reddit\.com$': 'teddit.example.com' +# '(.*\.)?redd\.it$': 'teddit.example.com' +# '(www\.)?twitter\.com$': 'nitter.example.com' +# 'spam\.example\.com': false # remove results from spam.example.com checker: # disable checker when in debug mode |