summaryrefslogtreecommitdiff
path: root/searx/engines
diff options
context:
space:
mode:
authorMarkus <markus@venom.fritz.box>2024-09-15 12:22:06 +0200
committerMarkus Heiser <markus.heiser@darmarIT.de>2024-09-15 12:48:35 +0200
commitcdb4927b8ba0aec61ae169b9e9b54a7e8f2f0e9f (patch)
treec3038e8e4f8622c2a9df9dc61894c5b95bc10d7f /searx/engines
parent84e2f9d46a7aada4347df7f4a79147170cc31dc0 (diff)
downloadsearxng-cdb4927b8ba0aec61ae169b9e9b54a7e8f2f0e9f.tar.gz
searxng-cdb4927b8ba0aec61ae169b9e9b54a7e8f2f0e9f.zip
[fix] fetch_traits: brave, google, annas_archive & radio_browser
This patch fixes a bug reported by CI "Fetch traits" [1] (brave) and improves other fetch traits functions (google, annas_archive & radio_browser). brave: File "/home/runner/work/searxng/searxng/searx/engines/brave.py", line 434, in fetch_traits sxng_tag = region_tag(babel.Locale.parse(ui_lang, sep='-')) ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ File "/home/runner/work/searxng/searxng/searx/locales.py", line 155, in region_tag Error: raise ValueError('%s missed a territory') google: change ERROR message about unknow UI language to INFO message radio_browser: country_list contains duplicates that differ only in upper/lower case annas_archive: for better diff; sort the persistence of the traits [1] https://github.com/searxng/searxng/actions/runs/10606312371/job/29433352518#step:6:41 Signed-off-by: Markus <markus@venom.fritz.box>
Diffstat (limited to 'searx/engines')
-rw-r--r--searx/engines/annas_archive.py5
-rw-r--r--searx/engines/brave.py5
-rw-r--r--searx/engines/google.py2
-rw-r--r--searx/engines/radio_browser.py6
4 files changed, 13 insertions, 5 deletions
diff --git a/searx/engines/annas_archive.py b/searx/engines/annas_archive.py
index a290dd06e..bc74b3c86 100644
--- a/searx/engines/annas_archive.py
+++ b/searx/engines/annas_archive.py
@@ -184,3 +184,8 @@ def fetch_traits(engine_traits: EngineTraits):
for x in eval_xpath_list(dom, "//form//select[@name='sort']//option"):
engine_traits.custom['sort'].append(x.get("value"))
+
+ # for better diff; sort the persistence of these traits
+ engine_traits.custom['content'].sort()
+ engine_traits.custom['ext'].sort()
+ engine_traits.custom['sort'].sort()
diff --git a/searx/engines/brave.py b/searx/engines/brave.py
index 4c43386ed..6f7e342e7 100644
--- a/searx/engines/brave.py
+++ b/searx/engines/brave.py
@@ -430,7 +430,8 @@ def fetch_traits(engine_traits: EngineTraits):
ui_lang = option.get('value')
try:
- if '-' in ui_lang and not ui_lang.startswith("zh-"):
+ l = babel.Locale.parse(ui_lang, sep='-')
+ if l.territory:
sxng_tag = region_tag(babel.Locale.parse(ui_lang, sep='-'))
else:
sxng_tag = language_tag(babel.Locale.parse(ui_lang, sep='-'))
@@ -453,7 +454,7 @@ def fetch_traits(engine_traits: EngineTraits):
if not resp.ok: # type: ignore
print("ERROR: response from Brave is not OK.")
- country_js = resp.text[resp.text.index("options:{all") + len('options:') :]
+ country_js = resp.text[resp.text.index("options:{all") + len('options:') :] # type: ignore
country_js = country_js[: country_js.index("},k={default")]
country_tags = js_variable_to_python(country_js)
diff --git a/searx/engines/google.py b/searx/engines/google.py
index f9215783c..5fb5e9a76 100644
--- a/searx/engines/google.py
+++ b/searx/engines/google.py
@@ -441,7 +441,7 @@ def fetch_traits(engine_traits: EngineTraits, add_domains: bool = True):
try:
locale = babel.Locale.parse(lang_map.get(eng_lang, eng_lang), sep='-')
except babel.UnknownLocaleError:
- print("ERROR: %s -> %s is unknown by babel" % (x.get("data-name"), eng_lang))
+ print("INFO: google UI language %s (%s) is unknown by babel" % (eng_lang, x.text.split("(")[0].strip()))
continue
sxng_lang = language_tag(locale)
diff --git a/searx/engines/radio_browser.py b/searx/engines/radio_browser.py
index c20580616..a8f07a638 100644
--- a/searx/engines/radio_browser.py
+++ b/searx/engines/radio_browser.py
@@ -165,10 +165,12 @@ def fetch_traits(engine_traits: EngineTraits):
countrycodes = set()
for region in country_list:
- if region['iso_3166_1'] not in babel_reg_list:
+ # country_list contains duplicates that differ only in upper/lower case
+ _reg = region['iso_3166_1'].upper()
+ if _reg not in babel_reg_list:
print(f"ERROR: region tag {region['iso_3166_1']} is unknown by babel")
continue
- countrycodes.add(region['iso_3166_1'])
+ countrycodes.add(_reg)
countrycodes = list(countrycodes)
countrycodes.sort()