summaryrefslogtreecommitdiff
path: root/tests/unit/test_utils.py
diff options
context:
space:
mode:
authorMarkus Heiser <markus.heiser@darmarit.de>2023-02-07 14:11:58 +0100
committerMarkus Heiser <markus.heiser@darmarit.de>2023-03-24 10:37:42 +0100
commit16f0db44939c23d2980d6fd2e5dfada13d8f5ee9 (patch)
treeaff653cf2739f3d1fc35ac44b7adaa3ca0e14253 /tests/unit/test_utils.py
parent4d4aa13e1f1d254e5d57c67973a7809d9c1e21f9 (diff)
downloadsearxng-16f0db44939c23d2980d6fd2e5dfada13d8f5ee9.tar.gz
searxng-16f0db44939c23d2980d6fd2e5dfada13d8f5ee9.zip
[mod] replace utils.match_language by locales.match_locale
This patch replaces the *full of magic* ``utils.match_language`` function with ``locales.match_locale``. The ``locales.match_locale`` function is based on the ``locales.build_engine_locales`` introduced in 9ae409a0 [1]. In the past SearXNG only supported searching by language, not by region. This changed a long time ago: regions were added to the SearXNG core but not to the engines. ``utils.match_language`` was the function that handled the different aspects of languages/regions in the SearXNG core and the supported *languages* in the engines. ``utils.match_language`` did this with some magic; it works well for most use cases but fails in some edge cases. To resolve the competition between languages and regions in the SearXNG core, ``locales.build_engine_locales`` was introduced in 9ae409a0 [1]. With the latest patches all engines have been migrated to ``fetch_traits`` and a language/region concept that is based on ``locales.build_engine_locales``. To summarize: there is no longer a need for ``utils.match_language``. [1] https://github.com/searxng/searxng/pull/1652 Signed-off-by: Markus Heiser <markus.heiser@darmarit.de>
Diffstat (limited to 'tests/unit/test_utils.py')
-rw-r--r--tests/unit/test_utils.py33
1 files changed, 0 insertions, 33 deletions
diff --git a/tests/unit/test_utils.py b/tests/unit/test_utils.py
index 6f51f1ee3..2ad4593a1 100644
--- a/tests/unit/test_utils.py
+++ b/tests/unit/test_utils.py
@@ -87,39 +87,6 @@ class TestUtils(SearxTestCase):
html = '<p><b>Lorem ipsum</i>dolor sit amet</p>'
self.assertEqual(utils.html_to_text(html), "Lorem ipsum")
- def test_match_language(self):
- self.assertEqual(utils.match_language('es', ['es']), 'es')
- self.assertEqual(utils.match_language('es', [], fallback='fallback'), 'fallback')
- self.assertEqual(utils.match_language('ja', ['jp'], {'ja': 'jp'}), 'jp')
-
- # handle script tags
- self.assertEqual(utils.match_language('zh-CN', ['zh-Hans-CN', 'zh-Hant-TW']), 'zh-Hans-CN')
- self.assertEqual(utils.match_language('zh-TW', ['zh-Hans-CN', 'zh-Hant-TW']), 'zh-Hant-TW')
- self.assertEqual(utils.match_language('zh-Hans-CN', ['zh-CN', 'zh-TW']), 'zh-CN')
- self.assertEqual(utils.match_language('zh-Hant-TW', ['zh-CN', 'zh-TW']), 'zh-TW')
- self.assertEqual(utils.match_language('zh-Hans', ['zh-CN', 'zh-TW', 'zh-HK']), 'zh-CN')
- self.assertEqual(utils.match_language('zh-Hant', ['zh-CN', 'zh-TW', 'zh-HK']), 'zh-TW')
-
- aliases = {'en-GB': 'en-UK', 'he': 'iw'}
-
- # guess country
- self.assertEqual(utils.match_language('de-DE', ['de']), 'de')
- self.assertEqual(utils.match_language('de', ['de-DE']), 'de-DE')
- self.assertEqual(utils.match_language('es-CO', ['es-AR', 'es-ES', 'es-MX']), 'es-ES')
- self.assertEqual(utils.match_language('es-CO', ['es-MX']), 'es-MX')
- self.assertEqual(utils.match_language('en-UK', ['en-AU', 'en-GB', 'en-US']), 'en-GB')
- self.assertEqual(utils.match_language('en-GB', ['en-AU', 'en-UK', 'en-US'], aliases), 'en-UK')
-
- # language aliases
- self.assertEqual(utils.match_language('iw', ['he']), 'he')
- self.assertEqual(utils.match_language('he', ['iw'], aliases), 'iw')
- self.assertEqual(utils.match_language('iw-IL', ['he']), 'he')
- self.assertEqual(utils.match_language('he-IL', ['iw'], aliases), 'iw')
- self.assertEqual(utils.match_language('iw', ['he-IL']), 'he-IL')
- self.assertEqual(utils.match_language('he', ['iw-IL'], aliases), 'iw-IL')
- self.assertEqual(utils.match_language('iw-IL', ['he-IL']), 'he-IL')
- self.assertEqual(utils.match_language('he-IL', ['iw-IL'], aliases), 'iw-IL')
-
def test_ecma_unscape(self):
self.assertEqual(utils.ecma_unescape('text%20with%20space'), 'text with space')
self.assertEqual(utils.ecma_unescape('text using %xx: %F3'), 'text using %xx: ó')