|  | # SPDX-License-Identifier: AGPL-3.0-or-later
 | 
						
						
						
							|  | # pylint: disable=missing-module-docstring
 | 
						
						
						
							|  | 
 | 
						
						
						
							|  | from __future__ import annotations
 | 
						
						
						
							|  | 
 | 
						
						
						
							|  | import re
 | 
						
						
						
							|  | from urllib.parse import urlunparse, parse_qsl, urlencode
 | 
						
						
						
							|  | 
 | 
						
						
						
							|  | from flask_babel import gettext
 | 
						
						
						
							|  | 
 | 
						
						
						
							|  | regexes = {
 | 
						
						
						
							|  |     re.compile(r'utm_[^&]+'),
 | 
						
						
						
							|  |     re.compile(r'(wkey|wemail)[^&]*'),
 | 
						
						
						
							|  |     re.compile(r'(_hsenc|_hsmi|hsCtaTracking|__hssc|__hstc|__hsfp)[^&]*'),
 | 
						
						
						
							|  |     re.compile(r'&$'),
 | 
						
						
						
							|  | }
 | 
						
						
						
							|  | 
 | 
						
						
						
							|  | name = gettext('Tracker URL remover')
 | 
						
						
						
							|  | description = gettext('Remove trackers arguments from the returned URL')
 | 
						
						
						
							|  | default_on = True
 | 
						
						
						
							|  | preference_section = 'privacy'
 | 
						
						
						
							|  | 
 | 
						
						
						
							|  | 
 | 
						
						
						
							|  | def on_result(_request, _search, result) -> bool:
 | 
						
						
						
							|  | 
 | 
						
						
						
							|  |     parsed_url = getattr(result, "parsed_url", None)
 | 
						
						
						
							|  |     if not parsed_url:
 | 
						
						
						
							|  |         return True
 | 
						
						
						
							|  | 
 | 
						
						
						
							|  |     if parsed_url.query == "":
 | 
						
						
						
							|  |         return True
 | 
						
						
						
							|  | 
 | 
						
						
						
							|  |     parsed_query = parse_qsl(parsed_url.query)
 | 
						
						
						
							|  |     changes = 0
 | 
						
						
						
							|  |     for i, (param_name, _) in enumerate(list(parsed_query)):
 | 
						
						
						
							|  |         for reg in regexes:
 | 
						
						
						
							|  |             if reg.match(param_name):
 | 
						
						
						
							|  |                 parsed_query.pop(i - changes)
 | 
						
						
						
							|  |                 changes += 1
 | 
						
						
						
							|  |                 result.parsed_url = result.parsed_url._replace(query=urlencode(parsed_query))
 | 
						
						
						
							|  |                 result.url = urlunparse(result.parsed_url)
 | 
						
						
						
							|  |                 break
 | 
						
						
						
							|  | 
 | 
						
						
						
							|  |     return True
 |