diff options
author | Noémi Ványi <kvch@users.noreply.github.com> | 2019-01-04 22:14:40 +0100 |
---|---|---|
committer | GitHub <noreply@github.com> | 2019-01-04 22:14:40 +0100 |
commit | aeb6dab1872921fc129d47830620ae78bc185e53 (patch) | |
tree | 48097abd82e8e41f1022c16fc5aa46f5ee78914d | |
parent | 0d86ed9c7e274c69bcee4bca838e19ec4f632699 (diff) | |
parent | 82bf9c6b290423b5b7b300fc3af68bbfa32f3d4f (diff) | |
download | searxng-aeb6dab1872921fc129d47830620ae78bc185e53.tar.gz searxng-aeb6dab1872921fc129d47830620ae78bc185e53.zip |
Merge branch 'master' into master
-rw-r--r-- | searx/engines/bing_images.py | 4 | ||||
-rw-r--r-- | searx/engines/startpage.py | 7 | ||||
-rw-r--r-- | tests/unit/engines/test_bing_images.py | 6 | ||||
-rw-r--r-- | tests/unit/engines/test_startpage.py | 22 |
4 files changed, 19 insertions, 20 deletions
diff --git a/searx/engines/bing_images.py b/searx/engines/bing_images.py index 66e14c01f..876011f1d 100644 --- a/searx/engines/bing_images.py +++ b/searx/engines/bing_images.py @@ -88,9 +88,7 @@ def response(resp): url = json_data.get('purl') img_src = json_data.get('murl') - - thumb_json_data = loads(_quote_keys_regex.sub(r'\1"\2": \3', link.attrib.get('mad'))) - thumbnail = thumb_json_data.get('turl') + thumbnail = json_data.get('turl') # append result results.append({'template': 'images.html', diff --git a/searx/engines/startpage.py b/searx/engines/startpage.py index a52d9128d..55efdc884 100644 --- a/searx/engines/startpage.py +++ b/searx/engines/startpage.py @@ -32,8 +32,9 @@ search_url = base_url + 'do/search' # specific xpath variables # ads xpath //div[@id="results"]/div[@id="sponsored"]//div[@class="result"] # not ads: div[@class="result"] are the direct childs of div[@id="results"] -results_xpath = '//div[@class="result"]' +results_xpath = '//li[contains(@class, "search-result") and contains(@class, "search-item")]' link_xpath = './/h3/a' +content_xpath = './p[@class="search-item__body"]' # do search-request @@ -75,8 +76,8 @@ def response(resp): title = extract_text(link) - if result.xpath('./p[@class="desc clk"]'): - content = extract_text(result.xpath('./p[@class="desc clk"]')) + if result.xpath(content_xpath): + content = extract_text(result.xpath(content_xpath)) else: content = '' diff --git a/tests/unit/engines/test_bing_images.py b/tests/unit/engines/test_bing_images.py index afc4cd6f0..cb1d550d9 100644 --- a/tests/unit/engines/test_bing_images.py +++ b/tests/unit/engines/test_bing_images.py @@ -52,7 +52,7 @@ class TestBingImagesEngine(SearxTestCase): <li> <div> <div class="imgpt"> - <a m='{"purl":"page_url","murl":"img_url"}' mad='{"turl":"thumb_url"}'> + <a m='{"purl":"page_url","murl":"img_url","turl":"thumb_url"}'> <img src="" alt="alt text" /> </a> </div> @@ -60,7 +60,7 @@ class TestBingImagesEngine(SearxTestCase): </div> <div> <div class="imgpt"> - <a m='{"purl":"page_url2","murl":"img_url2"}' mad='{"turl":"thumb_url2"}'> + <a m='{"purl":"page_url2","murl":"img_url2","turl":"thumb_url2"}'> <img src="" alt="alt text 2" /> </a> </div> @@ -71,7 +71,7 @@ class TestBingImagesEngine(SearxTestCase): <li> <div> <div class="imgpt"> - <a m='{"purl":"page_url3","murl":"img_url3"}' mad='{"turl":"thumb_url3"}'> + <a m='{"purl":"page_url3","murl":"img_url3","turl":"thumb_url3"}'> <img src="" alt="alt text 3" /> </a> </div> diff --git a/tests/unit/engines/test_startpage.py b/tests/unit/engines/test_startpage.py index bdb3356b7..4a8a443dd 100644 --- a/tests/unit/engines/test_startpage.py +++ b/tests/unit/engines/test_startpage.py @@ -31,14 +31,14 @@ class TestStartpageEngine(SearxTestCase): self.assertEqual(startpage.response(response), []) html = """ - <div class='result' style=' *width : auto; *margin-right : 10%;'> + <li class="search-result search-item"> <h3> <a href='http://this.should.be.the.link/' id='title_2' name='title_2' > This should be the title </a> <span id='title_stars_2' name='title_stars_2'> </span> </h3> - <p class='desc clk'> + <p class="search-item__body"> This should be the content. </p> <p> @@ -56,7 +56,7 @@ class TestStartpageEngine(SearxTestCase): Mis en surbrillance </A> </p> - </div> + </li> """ response = mock.Mock(text=html.encode('utf-8')) results = startpage.response(response) @@ -67,14 +67,14 @@ class TestStartpageEngine(SearxTestCase): self.assertEqual(results[0]['content'], 'This should be the content.') html = """ - <div class='result' style=' *width : auto; *margin-right : 10%;'> + <li class="search-result search-item"> <h3> <a href='http://www.google.com/aclk?sa=l&ai=C' id='title_2' name='title_2' > This should be the title </a> <span id='title_stars_2' name='title_stars_2'> </span> </h3> - <p class='desc clk'> + <p class="search-item__body"> This should be the content. </p> <p> @@ -92,20 +92,20 @@ class TestStartpageEngine(SearxTestCase): Mis en surbrillance </A> </p> - </div> - <div class='result' style=' *width : auto; *margin-right : 10%;'> + </li> + <li class="search-result search-item"> <h3> <span id='title_stars_2' name='title_stars_2'> </span> </h3> - <p class='desc clk'> + <p class="search-item__body"> This should be the content. </p> <p> <span class='url'>www.speed<b>test</b>.net/fr/ </span> </p> - </div> - <div class='result' style=' *width : auto; *margin-right : 10%;'> + </li> + <li class="search-result search-item"> <h3> <a href='http://this.should.be.the.link/' id='title_2' name='title_2' > This should be the title @@ -127,7 +127,7 @@ class TestStartpageEngine(SearxTestCase): Mis en surbrillance </A> </p> - </div> + </li> """ response = mock.Mock(text=html.encode('utf-8')) results = startpage.response(response) |