| 
									
										
										
										
											2021-03-13 20:27:47 +01:00
										 |  |  | # SPDX-License-Identifier: AGPL-3.0-or-later | 
					
						
							| 
									
										
										
										
											2021-04-26 20:18:20 +02:00
										 |  |  | # lint: pylint | 
					
						
							| 
									
										
										
										
											2021-03-13 20:27:47 +01:00
										 |  |  | """
 | 
					
						
							|  |  |  |  Solr | 
					
						
							|  |  |  | """
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-09-07 13:26:59 +02:00
										 |  |  | # pylint: disable=global-statement | 
					
						
							| 
									
										
										
										
											2021-03-13 20:27:47 +01:00
										 |  |  | 
 | 
					
						
							|  |  |  | from json import loads | 
					
						
							|  |  |  | from urllib.parse import urlencode | 
					
						
							|  |  |  | from searx.exceptions import SearxEngineAPIException | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | base_url = 'http://localhost:8983' | 
					
						
							|  |  |  | collection = '' | 
					
						
							|  |  |  | rows = 10 | 
					
						
							|  |  |  | sort = '' # sorting: asc or desc | 
					
						
							|  |  |  | field_list = 'name' # list of field names to display on the UI | 
					
						
							|  |  |  | default_fields = '' # default field to query | 
					
						
							|  |  |  | query_fields = '' # query fields | 
					
						
							|  |  |  | _search_url = '' | 
					
						
							|  |  |  | paging = True | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | def init(_): | 
					
						
							|  |  |  |     if collection == '': | 
					
						
							|  |  |  |         raise ValueError('collection cannot be empty') | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     global _search_url | 
					
						
							|  |  |  |     _search_url = base_url + '/solr/' + collection + '/select?{params}' | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | def request(query, params): | 
					
						
							|  |  |  |     query_params = {'q': query, 'rows': rows} | 
					
						
							|  |  |  |     if field_list != '': | 
					
						
							|  |  |  |         query_params['fl'] = field_list | 
					
						
							|  |  |  |     if query_fields != '': | 
					
						
							|  |  |  |         query_params['qf'] = query_fields | 
					
						
							|  |  |  |     if default_fields != '': | 
					
						
							|  |  |  |         query_params['df'] = default_fields | 
					
						
							|  |  |  |     if sort != '': | 
					
						
							|  |  |  |         query_params['sort'] = sort | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     if 'pageno' in params: | 
					
						
							|  |  |  |         query_params['start'] = rows * (params['pageno'] - 1) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     params['url'] = _search_url.format(params=urlencode(query_params)) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     return params | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | def response(resp): | 
					
						
							|  |  |  |     resp_json = __get_response(resp) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     results = [] | 
					
						
							|  |  |  |     for result in resp_json['response']['docs']: | 
					
						
							|  |  |  |         r = {key: str(value) for key, value in result.items()} | 
					
						
							|  |  |  |         if len(r) == 0: | 
					
						
							|  |  |  |             continue | 
					
						
							|  |  |  |         r['template'] = 'key-value.html' | 
					
						
							|  |  |  |         results.append(r) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     return results | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | def __get_response(resp): | 
					
						
							|  |  |  |     try: | 
					
						
							|  |  |  |         resp_json = loads(resp.text) | 
					
						
							|  |  |  |     except Exception as e: | 
					
						
							|  |  |  |         raise SearxEngineAPIException("failed to parse response") from e | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     if 'error' in resp_json: | 
					
						
							|  |  |  |         raise SearxEngineAPIException(resp_json['error']['msg']) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     return resp_json |