summaryrefslogtreecommitdiff
path: root/searx/plugins/tracker_url_remover.py
diff options
context:
space:
mode:
Diffstat (limited to 'searx/plugins/tracker_url_remover.py')
-rw-r--r--searx/plugins/tracker_url_remover.py52
1 files changed, 52 insertions, 0 deletions
diff --git a/searx/plugins/tracker_url_remover.py b/searx/plugins/tracker_url_remover.py
new file mode 100644
index 000000000..33dd621e1
--- /dev/null
+++ b/searx/plugins/tracker_url_remover.py
@@ -0,0 +1,52 @@
+'''
+searx is free software: you can redistribute it and/or modify
+it under the terms of the GNU Affero General Public License as published by
+the Free Software Foundation, either version 3 of the License, or
+(at your option) any later version.
+
+searx is distributed in the hope that it will be useful,
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+GNU Affero General Public License for more details.
+
+You should have received a copy of the GNU Affero General Public License
+along with searx. If not, see < http://www.gnu.org/licenses/ >.
+
+(C) 2015 by Adam Tauber, <asciimoo@gmail.com>
+'''
+
+from flask_babel import gettext
+import re
+from searx.url_utils import urlunparse, parse_qsl, urlencode
+
+regexes = {re.compile(r'utm_[^&]+'),
+ re.compile(r'(wkey|wemail)[^&]*'),
+ re.compile(r'&$')}
+
+name = gettext('Tracker URL remover')
+description = gettext('Remove trackers arguments from the returned URL')
+default_on = True
+preference_section = 'privacy'
+
+
+def on_result(request, search, result):
+ if 'parsed_url' not in result:
+ return True
+
+ query = result['parsed_url'].query
+
+ if query == "":
+ return True
+ parsed_query = parse_qsl(query)
+
+ changes = 0
+ for i, (param_name, _) in enumerate(list(parsed_query)):
+ for reg in regexes:
+ if reg.match(param_name):
+ parsed_query.pop(i - changes)
+ changes += 1
+ result['parsed_url'] = result['parsed_url']._replace(query=urlencode(parsed_query))
+ result['url'] = urlunparse(result['parsed_url'])
+ break
+
+ return True