diff options
author | Cqoicebordel <Cqoicebordel@users.noreply.github.com> | 2015-06-09 16:16:07 +0200 |
---|---|---|
committer | Cqoicebordel <Cqoicebordel@users.noreply.github.com> | 2015-06-09 16:16:07 +0200 |
commit | 617495cca8b2799945be2c2b042dcc7ce905741a (patch) | |
tree | b5abd686998cd30ee53686d7867b0a127fb88dbf /searx/plugins/tracker_url_remover.py | |
parent | 4e28f12bfcc73b47f382bceedb5b65ee314674ae (diff) | |
download | searxng-617495cca8b2799945be2c2b042dcc7ce905741a.tar.gz searxng-617495cca8b2799945be2c2b042dcc7ce905741a.zip |
Add a plugin to remove trackers from results URLs
Diffstat (limited to 'searx/plugins/tracker_url_remover.py')
-rw-r--r-- | searx/plugins/tracker_url_remover.py | 40 |
1 files changed, 40 insertions, 0 deletions
diff --git a/searx/plugins/tracker_url_remover.py b/searx/plugins/tracker_url_remover.py new file mode 100644 index 000000000..c8459548f --- /dev/null +++ b/searx/plugins/tracker_url_remover.py @@ -0,0 +1,40 @@ +''' +searx is free software: you can redistribute it and/or modify +it under the terms of the GNU Affero General Public License as published by +the Free Software Foundation, either version 3 of the License, or +(at your option) any later version. + +searx is distributed in the hope that it will be useful, +but WITHOUT ANY WARRANTY; without even the implied warranty of +MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +GNU Affero General Public License for more details. + +You should have received a copy of the GNU Affero General Public License +along with searx. If not, see < http://www.gnu.org/licenses/ >. + +(C) 2015 by Adam Tauber, <asciimoo@gmail.com> +''' + +from flask.ext.babel import gettext +import re + +re1 = re.compile(r'utm_[^&]+&?') +re2 = re.compile(r'(wkey|wemail)[^&]+&?') +re3 = re.compile(r'&$') +re4 = re.compile(r'^\?$') + +name = gettext('Tracker URL remover') +description = gettext('Remove trackers arguments from the returned URL') +default_on = True + + +def on_result(request, ctx): + url = ctx['result']['url'] + + url = re1.sub('', url) + url = re2.sub('', url) + url = re3.sub('', url) + url = re4.sub('', url) + + ctx['result']['url'] = url + return True |