diff options
author | marc <a01200356@itesm.mx> | 2016-12-28 23:24:56 -0600 |
---|---|---|
committer | marc <a01200356@itesm.mx> | 2016-12-29 01:55:30 -0600 |
commit | 1175b3906f801c2ad3b6aa1f0718aedd7811dd5f (patch) | |
tree | 54ad08f8e7a4bbbb101c732efb1df872c4ceadd6 /searx/engines | |
parent | 7388067f1546f560830a25d0082c0ab9fc1cba34 (diff) | |
download | searxng-1175b3906f801c2ad3b6aa1f0718aedd7811dd5f.tar.gz searxng-1175b3906f801c2ad3b6aa1f0718aedd7811dd5f.zip |
Change the language list to only include languages that are supported by
a minimum number of engines.
Users can still query less widely supported languages through the :lang_code bang.
Diffstat (limited to 'searx/engines')
-rw-r--r-- | searx/engines/gigablast.py | 9 | ||||
-rw-r--r-- | searx/engines/wikipedia.py | 2 |
2 files changed, 8 insertions, 3 deletions
diff --git a/searx/engines/gigablast.py b/searx/engines/gigablast.py index 827b9cd03..0c1d7f613 100644 --- a/searx/engines/gigablast.py +++ b/searx/engines/gigablast.py @@ -95,8 +95,13 @@ def _fetch_supported_languages(resp): dom = fromstring(resp.text) links = dom.xpath('//span[@id="menu2"]/a') for link in links: - code = link.xpath('./@href')[0][-2:] - if code != 'xx' and code not in supported_languages: + href = link.xpath('./@href')[0].split('lang%3A') + if len(href) == 2: + code = href[1].split('_') + if len(code) == 2: + code = code[0] + '-' + code[1].upper() + else: + code = code[0] supported_languages.append(code) return supported_languages diff --git a/searx/engines/wikipedia.py b/searx/engines/wikipedia.py index 78acd349d..3af8f1c71 100644 --- a/searx/engines/wikipedia.py +++ b/searx/engines/wikipedia.py @@ -132,7 +132,7 @@ def _fetch_supported_languages(resp): english_name = td[1].xpath('./a')[0].text articles = int(td[4].xpath('./a/b')[0].text.replace(',', '')) # exclude languages with too few articles - if articles >= 100000: + if articles >= 100: supported_languages[code] = {"name": name, "english_name": english_name, "articles": articles} return supported_languages |