2015-06-09 14:16:07 +00:00
|
|
|
'''
|
|
|
|
searx is free software: you can redistribute it and/or modify
|
|
|
|
it under the terms of the GNU Affero General Public License as published by
|
|
|
|
the Free Software Foundation, either version 3 of the License, or
|
|
|
|
(at your option) any later version.
|
|
|
|
|
|
|
|
searx is distributed in the hope that it will be useful,
|
|
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
GNU Affero General Public License for more details.
|
|
|
|
|
|
|
|
You should have received a copy of the GNU Affero General Public License
|
|
|
|
along with searx. If not, see < http://www.gnu.org/licenses/ >.
|
|
|
|
|
|
|
|
(C) 2015 by Adam Tauber, <asciimoo@gmail.com>
|
|
|
|
'''
|
|
|
|
|
|
|
|
from flask.ext.babel import gettext
|
|
|
|
import re
|
2015-06-18 12:27:15 +00:00
|
|
|
from urlparse import urlunparse
|
2015-06-09 14:16:07 +00:00
|
|
|
|
2015-06-15 18:34:02 +00:00
|
|
|
regexes = {re.compile(r'utm_[^&]+&?'),
|
|
|
|
re.compile(r'(wkey|wemail)[^&]+&?'),
|
|
|
|
re.compile(r'&$')}
|
2015-06-09 14:16:07 +00:00
|
|
|
|
|
|
|
name = gettext('Tracker URL remover')
|
|
|
|
description = gettext('Remove trackers arguments from the returned URL')
|
|
|
|
default_on = True
|
|
|
|
|
|
|
|
|
|
|
|
def on_result(request, ctx):
|
2015-06-18 12:27:15 +00:00
|
|
|
query = ctx['result']['parsed_url'].query
|
2015-06-09 14:16:07 +00:00
|
|
|
|
2015-06-18 12:27:15 +00:00
|
|
|
if query == "":
|
2015-06-15 18:34:02 +00:00
|
|
|
return True
|
|
|
|
|
|
|
|
for reg in regexes:
|
2015-06-18 12:27:15 +00:00
|
|
|
query = reg.sub('', query)
|
2015-06-15 18:34:02 +00:00
|
|
|
|
2015-06-18 12:27:15 +00:00
|
|
|
if query != ctx['result']['parsed_url'].query:
|
|
|
|
ctx['result']['parsed_url'] = ctx['result']['parsed_url']._replace(query=query)
|
|
|
|
ctx['result']['url'] = urlunparse(ctx['result']['parsed_url'])
|
2015-06-09 14:16:07 +00:00
|
|
|
|
|
|
|
return True
|