diff options
author | Thomas Pointhuber <thomas.pointhuber@gmx.at> | 2015-08-24 11:28:55 +0200 |
---|---|---|
committer | Thomas Pointhuber <thomas.pointhuber@gmx.at> | 2015-08-24 11:28:55 +0200 |
commit | 23b9095cbf2d31a1495ee3d63a55bd81548cd367 (patch) | |
tree | aa09c965a14106f475cf68fef3b230f1e70fe798 /searx/engines/startpage.py | |
parent | 5bffa9ca33f8ec98baebca13ee9b16262bfe4e8d (diff) | |
download | searxng-23b9095cbf2d31a1495ee3d63a55bd81548cd367.tar.gz searxng-23b9095cbf2d31a1495ee3d63a55bd81548cd367.zip |
[fix] improve result handling of startpage engine
Diffstat (limited to 'searx/engines/startpage.py')
-rw-r--r-- | searx/engines/startpage.py | 6 |
1 file changed, 5 insertions, 1 deletion
diff --git a/searx/engines/startpage.py b/searx/engines/startpage.py
index 9d5b4befe..08e4f7a5b 100644
--- a/searx/engines/startpage.py
+++ b/searx/engines/startpage.py
@@ -66,7 +66,11 @@ def response(resp):
         url = link.attrib.get('href')
 
         # block google-ad url's
-        if re.match("^http(s|)://www.google.[a-z]+/aclk.*$", url):
+        if re.match("^http(s|)://(www\.)?google\.[a-z]+/aclk.*$", url):
+            continue
+
+        # block startpage search url's
+        if re.match("^http(s|)://(www\.)?startpage\.com/do/search\?.*$", url):
             continue
 
         title = escape(extract_text(link))