| 
									
										
										
										
											2015-06-09 16:16:07 +02:00
										 |  |  | '''
 | 
					
						
							|  |  |  | searx is free software: you can redistribute it and/or modify | 
					
						
							|  |  |  | it under the terms of the GNU Affero General Public License as published by | 
					
						
							|  |  |  | the Free Software Foundation, either version 3 of the License, or | 
					
						
							|  |  |  | (at your option) any later version. | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | searx is distributed in the hope that it will be useful, | 
					
						
							|  |  |  | but WITHOUT ANY WARRANTY; without even the implied warranty of | 
					
						
							|  |  |  | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the | 
					
						
							|  |  |  | GNU Affero General Public License for more details. | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | You should have received a copy of the GNU Affero General Public License | 
					
						
							|  |  |  | along with searx. If not, see < http://www.gnu.org/licenses/ >. | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | (C) 2015 by Adam Tauber, <asciimoo@gmail.com> | 
					
						
							|  |  |  | '''
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | from flask.ext.babel import gettext | 
					
						
							|  |  |  | import re | 
					
						
							| 
									
										
										
										
											2015-06-18 14:27:15 +02:00
										 |  |  | from urlparse import urlunparse | 
					
						
							| 
									
										
										
										
											2015-06-09 16:16:07 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-06-15 20:34:02 +02:00
										 |  |  | regexes = {re.compile(r'utm_[^&]+&?'), | 
					
						
							|  |  |  |            re.compile(r'(wkey|wemail)[^&]+&?'), | 
					
						
							|  |  |  |            re.compile(r'&$')} | 
					
						
							| 
									
										
										
										
											2015-06-09 16:16:07 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  | name = gettext('Tracker URL remover') | 
					
						
							|  |  |  | description = gettext('Remove trackers arguments from the returned URL') | 
					
						
							|  |  |  | default_on = True | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | def on_result(request, ctx): | 
					
						
							| 
									
										
										
										
											2015-06-18 14:27:15 +02:00
										 |  |  |     query = ctx['result']['parsed_url'].query | 
					
						
							| 
									
										
										
										
											2015-06-09 16:16:07 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-06-18 14:27:15 +02:00
										 |  |  |     if query == "": | 
					
						
							| 
									
										
										
										
											2015-06-15 20:34:02 +02:00
										 |  |  |         return True | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     for reg in regexes: | 
					
						
							| 
									
										
										
										
											2015-06-18 14:27:15 +02:00
										 |  |  |         query = reg.sub('', query) | 
					
						
							| 
									
										
										
										
											2015-06-15 20:34:02 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-06-18 14:27:15 +02:00
										 |  |  |     if query != ctx['result']['parsed_url'].query: | 
					
						
							|  |  |  |         ctx['result']['parsed_url'] = ctx['result']['parsed_url']._replace(query=query) | 
					
						
							|  |  |  |         ctx['result']['url'] = urlunparse(ctx['result']['parsed_url']) | 
					
						
							| 
									
										
										
										
											2015-06-09 16:16:07 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  |     return True |