From 7b6b772e3485c60c4c1a3abda8d7bd862ea9d858 Mon Sep 17 00:00:00 2001
From: Markus Heiser
Date: Wed, 27 Nov 2024 14:56:14 +0100
Subject: [fix] wikicommons engine: remove HTML tags from result items

BTW: humanize filesize (Bytes) to KB, MB, GB ..

Signed-off-by: Markus Heiser
---
 searx/engines/wikicommons.py | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

diff --git a/searx/engines/wikicommons.py b/searx/engines/wikicommons.py
index a229d24b6..214881bed 100644
--- a/searx/engines/wikicommons.py
+++ b/searx/engines/wikicommons.py
@@ -7,6 +7,8 @@ import datetime
 
 from urllib.parse import urlencode
 
+from searx.utils import html_to_text, humanize_bytes
+
 # about
 about = {
     "website": 'https://commons.wikimedia.org/',
@@ -74,7 +76,7 @@ def response(resp):
         result = {
             'url': imageinfo["descriptionurl"],
             'title': title,
-            'content': item["snippet"],
+            'content': html_to_text(item["snippet"]),
         }
 
         if search_type == "images":
@@ -93,7 +95,7 @@ def response(resp):
         elif search_type == "files":
             result['template'] = 'files.html'
             result['metadata'] = imageinfo['mime']
-            result['size'] = imageinfo['size']
+            result['size'] = humanize_bytes(imageinfo['size'])
 
         elif search_type == "audio":
             result['iframe_src'] = imageinfo['url']
-- 
cgit v1.2.3-54-g00ecf