123456789101112131415161718192021222324252627282930313233343536373839404142434445 |
- # SPDX-License-Identifier: AGPL-3.0-or-later
- # pylint: disable=missing-module-docstring
- from __future__ import annotations
- import re
- from urllib.parse import urlunparse, parse_qsl, urlencode
- from flask_babel import gettext
- regexes = {
- re.compile(r'utm_[^&]+'),
- re.compile(r'(wkey|wemail)[^&]*'),
- re.compile(r'(_hsenc|_hsmi|hsCtaTracking|__hssc|__hstc|__hsfp)[^&]*'),
- re.compile(r'&$'),
- }
- name = gettext('Tracker URL remover')
- description = gettext('Remove trackers arguments from the returned URL')
- default_on = True
- preference_section = 'privacy'
- def on_result(_request, _search, result) -> bool:
- parsed_url = getattr(result, "parsed_url", None)
- if not parsed_url:
- return True
- if parsed_url.query == "":
- return True
- parsed_query = parse_qsl(parsed_url.query)
- changes = 0
- for i, (param_name, _) in enumerate(list(parsed_query)):
- for reg in regexes:
- if reg.match(param_name):
- parsed_query.pop(i - changes)
- changes += 1
- result.parsed_url = result.parsed_url._replace(query=urlencode(parsed_query))
- result.url = urlunparse(result.parsed_url)
- break
- return True
|