summary | refs | log | tree | commit | diff
path: root/searx/engines/startpage.py
diff options
context:
space:
mode:
author: Thomas Pointhuber <thomas.pointhuber@gmx.at> 2015-08-24 11:28:55 +0200
committer: Thomas Pointhuber <thomas.pointhuber@gmx.at> 2015-08-24 11:28:55 +0200
commit: 23b9095cbf2d31a1495ee3d63a55bd81548cd367 (patch)
tree: aa09c965a14106f475cf68fef3b230f1e70fe798 /searx/engines/startpage.py
parent: 5bffa9ca33f8ec98baebca13ee9b16262bfe4e8d (diff)
download: searxng-23b9095cbf2d31a1495ee3d63a55bd81548cd367.tar.gz
searxng-23b9095cbf2d31a1495ee3d63a55bd81548cd367.zip
[fix] improve result handling of startpage engine
Diffstat (limited to 'searx/engines/startpage.py')
-rw-r--r-- searx/engines/startpage.py 6
1 files changed, 5 insertions, 1 deletions
diff --git a/searx/engines/startpage.py b/searx/engines/startpage.py
index 9d5b4befe..08e4f7a5b 100644
--- a/searx/engines/startpage.py
+++ b/searx/engines/startpage.py
@@ -66,7 +66,11 @@ def response(resp):
url = link.attrib.get('href')
# block google-ad url's
- if re.match("^http(s|)://www.google.[a-z]+/aclk.*$", url):
+ if re.match("^http(s|)://(www\.)?google\.[a-z]+/aclk.*$", url):
+ continue
+
+ # block startpage search url's
+ if re.match("^http(s|)://(www\.)?startpage\.com/do/search\?.*$", url):
continue
title = escape(extract_text(link))