summaryrefslogtreecommitdiff
path: root/searx
diff options
context:
space:
mode:
authorMarkus Heiser <markus.heiser@darmarit.de>2022-02-13 12:34:04 +0100
committerMarkus Heiser <markus.heiser@darmarit.de>2022-02-18 18:59:58 +0100
commit795e8af61dcb6f669ccc653f6524f652f7d62a5c (patch)
tree80b2814d5a34fca1143f3329e51c7de371888fd5 /searx
parent98cab4cf754752e8a615b7b6c2685021592889a7 (diff)
downloadsearxng-795e8af61dcb6f669ccc653f6524f652f7d62a5c.tar.gz
searxng-795e8af61dcb6f669ccc653f6524f652f7d62a5c.zip
[fix] hostname_replace.py: don't stop replace URL in fields
This is a rewrite of the hostname_replace.py that: - don't stop to replace URL in fields ('data_src', 'audio_src') if there isn't a 'parsed_url', - adds a comment about keep or remove a result from the result list - adds a loop over ['data_src', 'audio_src'] instead of doubling code lines Signed-off-by: Markus Heiser <markus.heiser@darmarit.de>
Diffstat (limited to 'searx')
-rw-r--r--searx/plugins/hostname_replace.py38
1 files changed, 21 insertions, 17 deletions
diff --git a/searx/plugins/hostname_replace.py b/searx/plugins/hostname_replace.py
index acbc6304c..51bd003b1 100644
--- a/searx/plugins/hostname_replace.py
+++ b/searx/plugins/hostname_replace.py
@@ -17,26 +17,30 @@ replacements = {re.compile(p): r for (p, r) in settings[plugin_id].items()} if p
logger = logger.getChild(plugin_id)
parsed = 'parsed_url'
+_url_fields = ['data_src', 'audio_src']
def on_result(request, search, result):
- if parsed not in result:
- return True
+
for (pattern, replacement) in replacements.items():
- if pattern.search(result[parsed].netloc):
- if not replacement:
- return False
- result[parsed] = result[parsed]._replace(netloc=pattern.sub(replacement, result[parsed].netloc))
- result['url'] = urlunparse(result[parsed])
- if result.get('data_src', False):
- parsed_data_src = urlparse(result['data_src'])
- if pattern.search(parsed_data_src.netloc):
- parsed_data_src = parsed_data_src._replace(netloc=pattern.sub(replacement, parsed_data_src.netloc))
- result['data_src'] = urlunparse(parsed_data_src)
- if result.get('audio_src', False):
- parsed_audio_src = urlparse(result['audio_src'])
- if pattern.search(parsed_audio_src.netloc):
- parsed_audio_src = parsed_audio_src._replace(netloc=pattern.sub(replacement, parsed_audio_src.netloc))
- result['audio_src'] = urlunparse(parsed_audio_src)
+
+ if parsed in result:
+ if pattern.search(result[parsed].netloc):
+ # to keep or remove this result from the result list depends
+ # (only) on the 'parsed_url'
+ if not replacement:
+ return False
+ result[parsed] = result[parsed]._replace(netloc=pattern.sub(replacement, result[parsed].netloc))
+ result['url'] = urlunparse(result[parsed])
+
+ for url_field in _url_fields:
+ if result.get(url_field):
+ url_src = urlparse(result[url_field])
+ if pattern.search(url_src.netloc):
+ if not replacement:
+ del result[url_field]
+ else:
+ url_src = url_src._replace(netloc=pattern.sub(replacement, url_src.netloc))
+ result[url_field] = urlunparse(url_src)
return True