mirror of
https://github.com/searxng/searxng.git
synced 2024-11-16 17:40:11 +01:00
2ca0aa4f29
More information here: https://knowledge.hubspot.com/settings/how-do-i-create-a-tracking-url https://knowledge.hubspot.com/ads/ad-tracking-in-hubspot https://knowledge.hubspot.com/ctas/calls-to-action-frequently-asked-questions https://meta.stackexchange.com/questions/263392/what-are-these-very-long-parameters-in-so-careers-feedback-always-welcome-url
54 lines
1.7 KiB
Python
54 lines
1.7 KiB
Python
'''
|
|
searx is free software: you can redistribute it and/or modify
|
|
it under the terms of the GNU Affero General Public License as published by
|
|
the Free Software Foundation, either version 3 of the License, or
|
|
(at your option) any later version.
|
|
|
|
searx is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU Affero General Public License for more details.
|
|
|
|
You should have received a copy of the GNU Affero General Public License
|
|
along with searx. If not, see < http://www.gnu.org/licenses/ >.
|
|
|
|
(C) 2015 by Adam Tauber, <asciimoo@gmail.com>
|
|
'''
|
|
|
|
from flask_babel import gettext
|
|
import re
|
|
from urllib.parse import urlunparse, parse_qsl, urlencode
|
|
|
|
regexes = {re.compile(r'utm_[^&]+'),
|
|
re.compile(r'(wkey|wemail)[^&]*'),
|
|
re.compile(r'(_hsenc|_hsmi|hsCtaTracking|__hssc|__hstc|__hsfp)[^&]*'),
|
|
re.compile(r'&$')}
|
|
|
|
name = gettext('Tracker URL remover')
|
|
description = gettext('Remove trackers arguments from the returned URL')
|
|
default_on = True
|
|
preference_section = 'privacy'
|
|
|
|
|
|
def on_result(request, search, result):
|
|
if 'parsed_url' not in result:
|
|
return True
|
|
|
|
query = result['parsed_url'].query
|
|
|
|
if query == "":
|
|
return True
|
|
parsed_query = parse_qsl(query)
|
|
|
|
changes = 0
|
|
for i, (param_name, _) in enumerate(list(parsed_query)):
|
|
for reg in regexes:
|
|
if reg.match(param_name):
|
|
parsed_query.pop(i - changes)
|
|
changes += 1
|
|
result['parsed_url'] = result['parsed_url']._replace(query=urlencode(parsed_query))
|
|
result['url'] = urlunparse(result['parsed_url'])
|
|
break
|
|
|
|
return True
|