| 1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798 | # SPDX-License-Identifier: AGPL-3.0-or-later# lint: pylint"""Bing (Videos)"""from json import loadsfrom urllib.parse import urlencodefrom lxml import htmlfrom searx.utils import match_languagefrom searx.engines.bing import language_aliasesfrom searx.engines.bing import (  # pylint: disable=unused-import    _fetch_supported_languages,    supported_languages_url,)about = {    "website": 'https://www.bing.com/videos',    "wikidata_id": 'Q4914152',    "official_api_documentation": 'https://www.microsoft.com/en-us/bing/apis/bing-video-search-api',    "use_official_api": False,    "require_api_key": False,    "results": 'HTML',}categories = ['videos', 'web']paging = Truesafesearch = Truetime_range_support = Truesend_accept_language_header = Truenumber_of_results = 28base_url = 'https://www.bing.com/'search_string = (    # fmt: off    'videos/search'    '?{query}'    '&count={count}'    '&first={first}'    '&scope=video'    '&FORM=QBLH'    # fmt: on)time_range_string = '&qft=+filterui:videoage-lt{interval}'time_range_dict = {'day': '1440', 'week': '10080', 'month': '43200', 'year': '525600'}# safesearch definitionssafesearch_types = {2: 'STRICT', 1: 'DEMOTE', 0: 'OFF'}# do search-requestdef request(query, params):    offset = ((params['pageno'] - 1) * number_of_results) + 1    search_path = search_string.format(query=urlencode({'q': query}), count=number_of_results, first=offset)    # safesearch cookie    params['cookies']['SRCHHPGUSR'] = 'ADLT=' + safesearch_types.get(params['safesearch'], 'DEMOTE')    # language cookie    language = match_language(params['language'], supported_languages, language_aliases).lower()    params['cookies']['_EDGE_S'] = 'mkt=' + language + '&F=1'    # query and paging    params['url'] = base_url + search_path    # time range    if params['time_range'] in time_range_dict:        params['url'] += time_range_string.format(interval=time_range_dict[params['time_range']])    return params# get response from search-requestdef response(resp):    results = []    dom = html.fromstring(resp.text)    for result in dom.xpath('//div[@class="dg_u"]/div[contains(@class, "mc_vtvc")]'):        metadata = loads(result.xpath('.//div[@class="vrhdata"]/@vrhm')[0])        info = ' - '.join(result.xpath('.//div[@class="mc_vtvc_meta_block"]//span/text()')).strip()        content = '{0} - {1}'.format(metadata['du'], info)        thumbnail = '{0}th?id={1}'.format(base_url, metadata['thid'])        results.append(            {                'url': metadata['murl'],                'thumbnail': thumbnail,                'title': metadata.get('vt', ''),                'content': content,                'template': 'videos.html',            }        )    return results
 |