Fix relative URLs that do not start with '/'
This commit is contained in:
		
							parent
							
								
									9f2446c444
								
							
						
					
					
						commit
						1d4657b714
					
				| @ -61,6 +61,10 @@ def extract_url(xpath_results, search_url): | |||||||
|         # fix relative url to the search engine |         # fix relative url to the search engine | ||||||
|         url = urljoin(search_url, url) |         url = urljoin(search_url, url) | ||||||
| 
 | 
 | ||||||
|  |     # fix relative urls that fall through the crack | ||||||
|  |     if '://' not in url: | ||||||
|  |         url = urljoin(search_url, url) | ||||||
|  | 
 | ||||||
|     # normalize url |     # normalize url | ||||||
|     url = normalize_url(url) |     url = normalize_url(url) | ||||||
| 
 | 
 | ||||||
|  | |||||||
		Loading…
	
		Reference in New Issue
	
	Block a user