| 
									
										
										
										
											2021-01-13 11:31:25 +01:00
										 |  |  | # SPDX-License-Identifier: AGPL-3.0-or-later | 
					
						
							| 
									
										
										
										
											2020-08-08 19:22:53 +02:00
										 |  |  | """
 | 
					
						
							|  |  |  |  peertube (Videos) | 
					
						
							|  |  |  | """
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | from json import loads | 
					
						
							|  |  |  | from datetime import datetime | 
					
						
							| 
									
										
										
										
											2020-08-06 17:42:46 +02:00
										 |  |  | from urllib.parse import urlencode | 
					
						
							| 
									
										
										
										
											2020-08-08 19:22:53 +02:00
										 |  |  | from searx.utils import html_to_text | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-01-13 11:31:25 +01:00
										 |  |  | # about | 
					
						
							|  |  |  | about = { | 
					
						
							|  |  |  |     "website": 'https://joinpeertube.org', | 
					
						
							|  |  |  |     "wikidata_id": 'Q50938515', | 
					
						
							|  |  |  |     "official_api_documentation": 'https://docs.joinpeertube.org/api-rest-reference.html', | 
					
						
							|  |  |  |     "use_official_api": True, | 
					
						
							|  |  |  |     "require_api_key": False, | 
					
						
							|  |  |  |     "results": 'JSON', | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-08-08 19:22:53 +02:00
										 |  |  | # engine dependent config | 
					
						
							|  |  |  | categories = ["videos"] | 
					
						
							|  |  |  | paging = True | 
					
						
							| 
									
										
										
										
											2021-02-13 19:47:33 +01:00
										 |  |  | base_url = "https://peer.tube" | 
					
						
							| 
									
										
										
										
											2021-06-04 11:09:36 +02:00
										 |  |  | supported_languages_url = ( | 
					
						
							|  |  |  |     'https://framagit.org/framasoft/peertube/search-index/-/raw/master/client/src/views/Search.vue' | 
					
						
							|  |  |  | ) | 
					
						
							| 
									
										
										
										
											2020-08-08 19:22:53 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | # do search-request | 
					
						
							|  |  |  | def request(query, params): | 
					
						
							| 
									
										
										
										
											2021-02-13 19:47:33 +01:00
										 |  |  |     sanitized_url = base_url.rstrip("/") | 
					
						
							| 
									
										
										
										
											2020-08-08 19:22:53 +02:00
										 |  |  |     pageno = (params["pageno"] - 1) * 15 | 
					
						
							| 
									
										
										
										
											2021-02-13 19:47:33 +01:00
										 |  |  |     search_url = sanitized_url + "/api/v1/search/videos/?pageno={pageno}&{query}" | 
					
						
							| 
									
										
										
										
											2020-08-08 19:22:53 +02:00
										 |  |  |     query_dict = {"search": query} | 
					
						
							|  |  |  |     language = params["language"].split("-")[0] | 
					
						
							|  |  |  |     if "all" != language and language in supported_languages: | 
					
						
							|  |  |  |         query_dict["languageOneOf"] = language | 
					
						
							|  |  |  |     params["url"] = search_url.format( | 
					
						
							|  |  |  |         query=urlencode(query_dict), pageno=pageno | 
					
						
							|  |  |  |     ) | 
					
						
							|  |  |  |     return params | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | def _get_offset_from_pageno(pageno): | 
					
						
							|  |  |  |     return (pageno - 1) * 15 + 1 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | # get response from search-request | 
					
						
							|  |  |  | def response(resp): | 
					
						
							| 
									
										
										
										
											2021-02-13 19:47:33 +01:00
										 |  |  |     sanitized_url = base_url.rstrip("/") | 
					
						
							| 
									
										
										
										
											2020-08-08 19:22:53 +02:00
										 |  |  |     results = [] | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     search_res = loads(resp.text) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     embedded_url = ( | 
					
						
							|  |  |  |         '<iframe width="560" height="315" sandbox="allow-same-origin allow-scripts allow-popups" ' | 
					
						
							|  |  |  |         + 'src="' | 
					
						
							| 
									
										
										
										
											2021-02-13 19:47:33 +01:00
										 |  |  |         + sanitized_url | 
					
						
							| 
									
										
										
										
											2020-08-08 19:22:53 +02:00
										 |  |  |         + '{embed_path}" frameborder="0" allowfullscreen></iframe>' | 
					
						
							|  |  |  |     ) | 
					
						
							|  |  |  |     # return empty array if there are no results | 
					
						
							|  |  |  |     if "data" not in search_res: | 
					
						
							|  |  |  |         return [] | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     # parse results | 
					
						
							|  |  |  |     for res in search_res["data"]: | 
					
						
							|  |  |  |         title = res["name"] | 
					
						
							| 
									
										
										
										
											2021-02-13 19:47:33 +01:00
										 |  |  |         url = sanitized_url + "/videos/watch/" + res["uuid"] | 
					
						
							| 
									
										
										
										
											2020-08-08 19:22:53 +02:00
										 |  |  |         description = res["description"] | 
					
						
							|  |  |  |         if description: | 
					
						
							|  |  |  |             content = html_to_text(res["description"]) | 
					
						
							|  |  |  |         else: | 
					
						
							| 
									
										
										
										
											2021-02-13 19:47:33 +01:00
										 |  |  |             content = "" | 
					
						
							|  |  |  |         thumbnail = sanitized_url + res["thumbnailPath"] | 
					
						
							| 
									
										
										
										
											2020-08-08 19:22:53 +02:00
										 |  |  |         publishedDate = datetime.strptime(res["publishedAt"], "%Y-%m-%dT%H:%M:%S.%fZ") | 
					
						
							| 
									
										
										
										
											2021-02-13 19:47:33 +01:00
										 |  |  |         embedded = embedded_url.format(embed_path=res["embedPath"]) | 
					
						
							| 
									
										
										
										
											2020-08-08 19:22:53 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  |         results.append( | 
					
						
							|  |  |  |             { | 
					
						
							|  |  |  |                 "template": "videos.html", | 
					
						
							|  |  |  |                 "url": url, | 
					
						
							|  |  |  |                 "title": title, | 
					
						
							|  |  |  |                 "content": content, | 
					
						
							|  |  |  |                 "publishedDate": publishedDate, | 
					
						
							|  |  |  |                 "embedded": embedded, | 
					
						
							|  |  |  |                 "thumbnail": thumbnail, | 
					
						
							|  |  |  |             } | 
					
						
							|  |  |  |         ) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     # return results | 
					
						
							|  |  |  |     return results | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | def _fetch_supported_languages(resp): | 
					
						
							| 
									
										
										
										
											2021-06-04 11:09:36 +02:00
										 |  |  |     import re | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     # https://docs.python.org/3/howto/regex.html#greedy-versus-non-greedy | 
					
						
							| 
									
										
										
										
											2021-07-23 12:03:16 +02:00
										 |  |  |     videolanguages = re.search(r"videoLanguages \(\)[^\n]+(.*?)\]", resp.text, re.DOTALL) | 
					
						
							| 
									
										
										
										
											2021-06-04 11:09:36 +02:00
										 |  |  |     peertube_languages = [m.group(1) for m in re.finditer(r"\{ id: '([a-z]+)', label:", videolanguages.group(1))] | 
					
						
							| 
									
										
										
										
											2020-08-08 19:22:53 +02:00
										 |  |  |     return peertube_languages |