diff options
author | Markus Heiser <markus.heiser@darmarIT.de> | 2022-08-10 20:50:45 +0200 |
---|---|---|
committer | GitHub <noreply@github.com> | 2022-08-10 20:50:45 +0200 |
commit | 43c545910b161731c3bc6791bdfa227c64e4489a (patch) | |
tree | ca9b92100822cc2ddc90b5232815239d9fb72b1c /searx | |
parent | 5706d110f2580a9c84618060d017a92405cf44e2 (diff) | |
parent | eb02cc77c56c8e93d305ee8aafc6e80c326e838f (diff) | |
download | searxng-43c545910b161731c3bc6791bdfa227c64e4489a.tar.gz searxng-43c545910b161731c3bc6791bdfa227c64e4489a.zip |
Merge pull request #1648 from unixfox/google_mobile_ui_parameter
output format protobuf to HTML for google mobile
Diffstat (limited to 'searx')
-rw-r--r-- | searx/engines/google.py | 17 |
1 files changed, 5 insertions, 12 deletions
```diff
diff --git a/searx/engines/google.py b/searx/engines/google.py
index 5e80f6dcc..9cb936ccf 100644
--- a/searx/engines/google.py
+++ b/searx/engines/google.py
@@ -112,21 +112,14 @@ filter_mapping = {0: 'off', 1: 'medium', 2: 'high'}
 # specific xpath variables
 # ------------------------
 
-# google results are grouped into <div class="jtfYYd ..." ../>
-results_xpath = '//div[contains(@class, "jtfYYd")]'
+results_xpath = '//div[contains(@class, "MjjYud")]'
+title_xpath = './/h3[1]'
+href_xpath = './/a/@href'
+content_xpath = './/div[@data-content-feature=1]'
 
 # google *sections* are no usual *results*, we ignore them
 g_section_with_header = './g-section-with-header'
 
-# the title is a h3 tag relative to the result group
-title_xpath = './/h3[1]'
-
-# in the result group there is <div class="yuRUbf" ../> it's first child is a <a
-# href=...>
-href_xpath = './/div[@class="yuRUbf"]//a/@href'
-
-# in the result group there is <div class="VwiC3b ..." ../> containing the *content*
-content_xpath = './/div[contains(@class, "VwiC3b")]'
 
 # Suggestions are links placed in a *card-section*, we extract only the text
 # from the links not the links itself.
@@ -261,7 +254,7 @@ def request(query, params):
     if use_mobile_ui:
         additional_parameters = {
             'asearch': 'arc',
-            'async': 'use_ac:true,_fmt:pc',
+            'async': 'use_ac:true,_fmt:html',
         }
 
     # https://www.google.de/search?q=corona&hl=de&lr=lang_de&start=0&tbs=qdr%3Ad&safe=medium
```