| 
							
							# SPDX-License-Identifier: AGPL-3.0-or-later
 | 
						
						
						
						
							 | 
							
							# lint: pylint
 | 
						
						
						
						
							 | 
							
							"""Peertube and :py:obj:`SepiaSearch <searx.engines.sepiasearch>` do share
 | 
						
						
						
						
							 | 
							
							(more or less) the same REST API and the schema of the JSON result is identical.
 | 
						
						
						
						
							 | 
							
							
 | 
						
						
						
						
							 | 
							
							"""
 | 
						
						
						
						
							 | 
							
							
 | 
						
						
						
						
							 | 
							
							import re
 | 
						
						
						
						
							 | 
							
							from urllib.parse import urlencode
 | 
						
						
						
						
							 | 
							
							from datetime import datetime
 | 
						
						
						
						
							 | 
							
							from dateutil.parser import parse
 | 
						
						
						
						
							 | 
							
							from dateutil.relativedelta import relativedelta
 | 
						
						
						
						
							 | 
							
							
 | 
						
						
						
						
							 | 
							
							import babel
 | 
						
						
						
						
							 | 
							
							
 | 
						
						
						
						
							 | 
							
							from searx import network
 | 
						
						
						
						
							 | 
							
							from searx.locales import language_tag
 | 
						
						
						
						
							 | 
							
							from searx.utils import html_to_text
 | 
						
						
						
						
							 | 
							
							from searx.enginelib.traits import EngineTraits
 | 
						
						
						
						
							 | 
							
							
 | 
						
						
						
						
							 | 
							
							# Engine traits object.  It is only annotated here (no value is assigned in
							# this module) and is read by ``request`` through ``traits.get_language``.
							# NOTE(review): presumably injected by the engine loader at runtime -- confirm.
							traits: EngineTraits
 | 
						
						
						
						
							 | 
							
							
 | 
						
						
						
						
							 | 
							
							# Descriptive metadata about the upstream service and the API this engine uses.
							about = {
							    # pylint: disable=line-too-long
							    "website": 'https://joinpeertube.org',
							    "wikidata_id": 'Q50938515',
							    "official_api_documentation": 'https://docs.joinpeertube.org/api-rest-reference.html#tag/Search/operation/searchVideos',
							    "use_official_api": True,
							    "require_api_key": False,
							    "results": 'JSON',
							}
 | 
						
						
						
						
							 | 
							
							
 | 
						
						
						
						
							 | 
							
							# engine dependent config
							categories = ["videos"]
							paging = True
							base_url = "https://peer.tube"
							"""Base URL of the Peertube instance.  A list of instances is available at:

							- https://instances.joinpeertube.org/instances
							"""

							time_range_support = True
							# Offsets that ``request`` adds to today's date to build the ``startDate``
							# filter.  ``day`` is a zero offset, i.e. the filter starts at the current date.
							time_range_table = {
							    'day': relativedelta(),
							    'week': relativedelta(weeks=-1),
							    'month': relativedelta(months=-1),
							    'year': relativedelta(years=-1),
							}

							safesearch = True
							# Maps the ``safesearch`` request parameter (0, 1, 2) to the value sent as
							# the ``nsfw`` query argument.
							safesearch_table = {0: 'both', 1: 'false', 2: 'false'}
 | 
						
						
						
						
							 | 
							
							
 | 
						
						
						
						
							 | 
							
							
 | 
						
						
						
						
							 | 
							
							def minute_to_hm(minute):
							    """Format an integer as ``<quotient>:<remainder>`` of a division by 60.

							    The remainder is zero-padded to two digits, e.g. ``125`` -> ``"2:05"``.

							    NOTE(review): the only caller visible in this module passes the ``duration``
							    field of a video result.  If that field is expressed in seconds the output
							    reads as ``m:ss`` rather than ``h:mm`` -- confirm against the API reference.

							    :param minute: value to format; anything that is not an ``int`` is rejected.
							    :returns: the formatted string, or ``None`` when ``minute`` is not an ``int``.
							    """
							    if not isinstance(minute, int):
							        return None
							    whole, rest = divmod(minute, 60)
							    return f"{whole:d}:{rest:02d}"
 | 
						
						
						
						
							 | 
							
							
 | 
						
						
						
						
							 | 
							
							
 | 
						
						
						
						
							 | 
							
							def request(query, params):
							    """Assemble request for the Peertube API.

							    Reads ``searxng_locale``, ``pageno``, ``safesearch`` and ``time_range`` from
							    ``params`` and stores the resulting search URL in ``params['url']``.

							    :param query: the search terms; an empty query short-circuits the request.
							    :param params: request parameter dict, updated in place.
							    :returns: ``False`` when ``query`` is empty, otherwise ``params``.
							    """
							    if not query:
							        return False

							    eng_lang = traits.get_language(params['searxng_locale'], None)

							    page_size = 10
							    query_args = {
							        'search': query,
							        'searchTarget': 'search-index',  # Vidiversum
							        'resultType': 'videos',
							        'start': (params['pageno'] - 1) * page_size,
							        'count': page_size,
							        # -createdAt: sort by date ascending / createdAt: date descending
							        'sort': '-match',  # sort by *match descending*
							        'nsfw': safesearch_table[params['safesearch']],
							    }
							    url = base_url.rstrip("/") + "/api/v1/search/videos?" + urlencode(query_args)

							    if eng_lang is not None:
							        # array-style arguments are appended by hand so the ``[]`` suffix is
							        # sent literally instead of being percent-encoded by ``urlencode``
							        url += '&languageOneOf[]=' + eng_lang
							        url += '&boostLanguages[]=' + eng_lang

							    if params['time_range'] in time_range_table:
							        start_date = datetime.now().date() + time_range_table[params['time_range']]
							        url += '&startDate=' + start_date.isoformat()

							    params['url'] = url
							    return params
 | 
						
						
						
						
							 | 
							
							
 | 
						
						
						
						
							 | 
							
							
 | 
						
						
						
						
							 | 
							
							def response(resp):
							    """Parse the engine response by delegating to ``video_response``.

							    :param resp: response object of the search request.
							    :returns: whatever ``video_response`` returns for ``resp``.
							    """
							    return video_response(resp)
 | 
						
						
						
						
							 | 
							
							
 | 
						
						
						
						
							 | 
							
							
 | 
						
						
						
						
							 | 
							
							def video_response(resp):
							    """Parse video response from SepiaSearch and Peertube instances.

							    Each entry of the ``data`` list in the JSON body becomes one result dict
							    for the ``videos.html`` template.  Optional fields (``channel``,
							    ``account``, ``tags``, ``description``) may be missing or null without
							    aborting the whole result list.

							    :param resp: response object; only ``resp.json()`` is used.
							    :returns: list of result dicts, empty when the body has no ``data`` key.
							    :raises KeyError: when an entry lacks ``url``, ``name`` or ``publishedAt``.
							    """
							    json_data = resp.json()
							    if 'data' not in json_data:
							        return []

							    results = []
							    for result in json_data['data']:
							        # ``or`` (instead of a ``.get`` default) also covers keys that are
							        # present but null in the JSON
							        channel = result.get('channel') or {}
							        account = result.get('account') or {}
							        tags = result.get('tags') or []

							        # build the ``name@host`` handle only when both parts exist;
							        # concatenating a missing part would raise TypeError
							        channel_name = channel.get('name')
							        channel_host = channel.get('host')
							        handle = None
							        if channel_name is not None and channel_host is not None:
							            handle = channel_name + '@' + channel_host

							        candidates = (channel.get('displayName'), handle, ', '.join(tags))
							        metadata = [item for item in candidates if item]

							        results.append(
							            {
							                'url': result['url'],
							                'title': result['name'],
							                'content': html_to_text(result.get('description') or ''),
							                'author': account.get('displayName'),
							                'length': minute_to_hm(result.get('duration')),
							                'template': 'videos.html',
							                'publishedDate': parse(result['publishedAt']),
							                'iframe_src': result.get('embedUrl'),
							                'thumbnail': result.get('thumbnailUrl') or result.get('previewUrl'),
							                'metadata': ' | '.join(metadata),
							            }
							        )

							    return results
 | 
						
						
						
						
							 | 
							
							
 | 
						
						
						
						
							 | 
							
							
 | 
						
						
						
						
							 | 
							
							def fetch_traits(engine_traits: EngineTraits):
							    """Fetch languages from peertube's search-index source code.

							    See videoLanguages_ in commit `8ed5c729 - Refactor and redesign client`_

							    The language ids are scraped from the ``videoLanguages`` list of the
							    client's ``Filters.vue`` and stored in ``engine_traits.languages``, keyed
							    by the tag that ``language_tag`` returns for the babel locale.  On a failed
							    download or an unrecognised file layout an error is printed and
							    ``engine_traits`` is left untouched.

							    .. _8ed5c729 - Refactor and redesign client:
							       https://framagit.org/framasoft/peertube/search-index/-/commit/8ed5c729
							    .. _videoLanguages:
							       https://framagit.org/framasoft/peertube/search-index/-/commit/8ed5c729#3d8747f9a60695c367c70bb64efba8f403721fad_0_291
							    """

							    resp = network.get(
							        'https://framagit.org/framasoft/peertube/search-index/-/raw/master/client/src/components/Filters.vue',
							        # the response from search-index repository is very slow
							        timeout=60,
							    )

							    if not resp.ok:
							        print("ERROR: response from peertube is not OK.")
							        return

							    # capture everything between the ``videoLanguages ()`` line and the first ``]``
							    js_lang = re.search(r"videoLanguages \(\)[^\n]+(.*?)\]", resp.text, re.DOTALL)
							    if not js_lang:
							        print("ERROR: can't determine languages from peertube")
							        return

							    for lang in re.finditer(r"\{ id: '([a-z]+)', label:", js_lang.group(1)):
							        eng_tag = lang.group(1)
							        if eng_tag == 'oc':
							            # Occitan is not known by babel, its closest relative is Catalan
							            # but 'ca' is already in the list of engine_traits.languages -->
							            # 'oc' will be ignored.
							            continue

							        try:
							            sxng_tag = language_tag(babel.Locale.parse(eng_tag))
							        except babel.UnknownLocaleError:
							            print("ERROR: %s is unknown by babel" % eng_tag)
							            continue

							        conflict = engine_traits.languages.get(sxng_tag)
							        if conflict:
							            # first mapping wins; only report when the engine tags differ
							            if conflict != eng_tag:
							                print("CONFLICT: babel %s --> %s, %s" % (sxng_tag, conflict, eng_tag))
							            continue
							        engine_traits.languages[sxng_tag] = eng_tag

							    # both Chinese script variants map to the single engine tag 'zh'
							    engine_traits.languages['zh_Hans'] = 'zh'
							    engine_traits.languages['zh_Hant'] = 'zh'
 |