# SPDX-License-Identifier: AGPL-3.0-or-later
"""Doku Wiki

Engine that queries the HTML search page of a DokuWiki instance and
extracts both the "quick hits" and the full-text search results.
"""

from urllib.parse import urlencode
from lxml.html import fromstring
from searx.utils import extract_text, eval_xpath

# about
about = {
    "website": 'https://www.dokuwiki.org/',
    "wikidata_id": 'Q851864',
    "official_api_documentation": 'https://www.dokuwiki.org/devel:xmlrpc',
    "use_official_api": False,
    "require_api_key": False,
    "results": 'HTML',
}

# engine dependent config
categories = ['general']  # TODO , 'images', 'music', 'videos', 'files'
paging = False
number_of_results = 5

# search-url
# Doku is OpenSearch compatible
base_url = 'http://localhost:8090'
search_url = '/?do=search'\
             '&{query}'
# TODO             '&startRecord={offset}'\
# TODO             '&maximumRecords={limit}'\


def request(query, params):
    """Fill in the outgoing request for a search.

    Sets ``params['url']`` to ``base_url`` followed by ``search_url`` with
    the query URL-encoded as the ``id`` parameter, and returns the same
    ``params`` mapping.
    """
    params['url'] = base_url +\
        search_url.format(query=urlencode({'id': query}))

    return params


def _wikilink(node):
    """Return ``(href, title)`` of the last ``a.wikilink1`` under *node*.

    Returns ``None`` when *node* contains no such anchor or when the href
    is empty, so callers can skip the entry without relying on exceptions.
    """
    hrefs = eval_xpath(node, './/a[@class="wikilink1"]/@href')
    if not hrefs:
        return None

    href = hrefs[-1]
    if not href:
        return None

    title = extract_text(eval_xpath(node, './/a[@class="wikilink1"]/@title'))
    return href, title


def response(resp):
    """Parse the search page in ``resp.text`` into a list of result dicts.

    Each result has the keys ``title``, ``content`` and ``url``.  Quick hits
    come first (with empty content), followed by the full-text results.
    """
    results = []

    doc = fromstring(resp.text)

    # Quickhits: one <li> per hit, no snippet available
    for item in eval_xpath(doc, '//div[@class="search_quickresult"]/ul/li'):
        link = _wikilink(item)
        if link is None:
            continue

        res_url, title = link
        results.append({'title': title,
                        'content': "",
                        'url': base_url + res_url})

    # Search results: the children of the <dl> alternate between <dt>
    # (link) and <dd> (snippet).  ``pending`` holds the link of the most
    # recent <dt>; it is reset to None when that <dt> has no usable link so
    # a following <dd> is never paired with an earlier, unrelated hit.
    pending = None
    for node in eval_xpath(doc, '//dl[@class="search_results"]/*'):
        if node.tag == "dt":
            pending = _wikilink(node)
        elif node.tag == "dd" and pending is not None:
            res_url, title = pending
            content = extract_text(eval_xpath(node, '.'))
            results.append({'title': title,
                            'content': content,
                            'url': base_url + res_url})

    return results