77 lines
		
	
	
		
			2.1 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
		
		
			
		
	
	
			77 lines
		
	
	
		
			2.1 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
|  | # SPDX-License-Identifier: AGPL-3.0-or-later | ||
|  | """Ipernity (images)""" | ||
|  | 
 | ||
|  | from datetime import datetime | ||
|  | from json import loads, JSONDecodeError | ||
|  | 
 | ||
|  | from urllib.parse import quote_plus | ||
|  | from lxml import html | ||
|  | 
 | ||
|  | from searx.utils import extr, extract_text, eval_xpath, eval_xpath_list | ||
|  | 
 | ||
# Descriptive metadata about the upstream service.  The flags state that
# results are scraped from HTML rather than fetched through the official API
# and that no API key is needed.
about = {
    "website": "https://www.ipernity.com",
    "official_api_documentation": "https://www.ipernity.com/help/api",
    "use_official_api": False,
    "require_api_key": False,
    "results": "HTML",
}

# Engine capabilities.  NOTE(review): neither name is read inside this module;
# presumably they are consumed by the engine framework -- confirm.
categories = ["images"]
paging = True

# Root of every URL built by this module (search requests and result links).
base_url = "https://www.ipernity.com"

# Number of results requested per page; embedded in the search URL.
page_size = 10
|  | 
 | ||
|  | 
 | ||
def request(query, params):
    """Store the Ipernity photo-search URL for *query* in ``params['url']``.

    The page number is read from ``params['pageno']`` and the page size from
    the module-level ``page_size``; the query is URL-encoded with
    ``quote_plus``.  The same ``params`` mapping is returned after mutation.
    """
    encoded_query = quote_plus(query)
    page_spec = f"page:{params['pageno']}:{page_size}"
    params['url'] = f"{base_url}/search/photo/@/{page_spec}?q={encoded_query}"
    return params
|  | 
 | ||
|  | 
 | ||
def _extract_info(script):
    """Return the photo metadata dict embedded in a ``<script>`` node, or ``None``.

    The metadata is the text between ``'] = '`` and ``'};'`` in the script
    body.  ``None`` is returned when nothing is extracted, when the fragment
    is not valid JSON, when the JSON value is not an object, or when it has no
    truthy ``mediakey`` entry.
    """
    fragment = extr(extract_text(script), '] = ', '};')
    # Check *before* restoring the closing brace: once '}' is appended the
    # string can never be empty, which would make this guard dead code.
    if not fragment:
        return None

    try:
        # The end marker '};' swallowed the object's closing brace; put it back.
        info_item = loads(fragment + '}')
    except JSONDecodeError:
        return None

    # Valid JSON is not necessarily an object (it may be a list, number, ...).
    if not isinstance(info_item, dict) or not info_item.get('mediakey'):
        return None
    return info_item


def _published_date(info_item):
    """Return ``posted_at`` converted to a ``datetime``, or ``None`` if unusable."""
    try:
        return datetime.fromtimestamp(int(info_item['posted_at']))
    except (KeyError, TypeError, ValueError, OverflowError, OSError):
        # Missing, non-numeric or out-of-range timestamp: keep the result but
        # without a date instead of failing the whole page.
        return None


def response(resp):
    """Build image results from an Ipernity search result page.

    The page is expected to carry one inline ``<script>`` per photo holding a
    JSON metadata object, and one ``<img>`` (inside an ``<a>`` whose ``href``
    starts with ``/doc``) per photo.  Metadata objects and images are paired
    by position: the n-th metadata object having a ``mediakey`` is matched
    with the n-th image.

    Args:
        resp: response object; only ``resp.text`` (the HTML body) is read.

    Returns:
        A list of result dicts using the ``images.html`` template.  Scripts
        without usable metadata are skipped, as are metadata objects lacking
        ``user_id`` or ``doc_id``.  Processing stops once the page has no more
        images to pair with.
    """
    results = []

    doc = html.fromstring(resp.text)
    images = eval_xpath_list(doc, '//a[starts-with(@href, "/doc")]//img')

    result_index = 0
    for script in eval_xpath_list(doc, '//script[@type="text/javascript"]'):
        info_item = _extract_info(script)
        if info_item is None:
            continue

        # More metadata objects than images: nothing left to pair with, and
        # indexing past the end would raise IndexError.
        if result_index >= len(images):
            break

        # Consume the image slot even if the item is dropped below, so that
        # later metadata objects stay aligned with their own images.
        image = images[result_index]
        result_index += 1

        user_id = info_item.get('user_id')
        doc_id = info_item.get('doc_id')
        if user_id is None or doc_id is None:
            # The result URL cannot be built without both identifiers.
            continue

        thumbnail_src = extract_text(eval_xpath(image, './@src'))
        # Same URL with the '240.jpg' suffix swapped for '640.jpg'
        # (presumably a larger rendition of the thumbnail -- confirm).
        img_src = thumbnail_src.replace('240.jpg', '640.jpg')

        resolution = None
        if info_item.get('width') and info_item.get('height'):
            resolution = f'{info_item["width"]}x{info_item["height"]}'

        results.append(
            {
                'template': 'images.html',
                'url': f"{base_url}/doc/{user_id}/{doc_id}",
                'title': info_item.get('title'),
                'content': info_item.get('content', ''),
                'resolution': resolution,
                'publishedDate': _published_date(info_item),
                'thumbnail_src': thumbnail_src,
                'img_src': img_src,
            }
        )

    return results