#!/usr/bin/env python
# SPDX-License-Identifier: AGPL-3.0-or-later
"""Fetch firefox useragent signatures

Output file: :origin:`searx/data/useragents.json` (:origin:`CI Update data ...
<.github/workflows/data-update.yml>`).

"""
# pylint: disable=use-dict-literal

import json
import re
from urllib.parse import urlparse, urljoin
from packaging.version import parse

import requests
from lxml import html
from searx.data import data_dir

DATA_FILE = data_dir / 'useragents.json'

URL = 'https://ftp.mozilla.org/pub/firefox/releases/'
RELEASE_PATH = '/pub/firefox/releases/'

NORMAL_REGEX = re.compile(r'^[0-9]+\.[0-9](\.[0-9])?$')
# BETA_REGEX = re.compile(r'.*[0-9]b([0-9\-a-z]+)$')
# ESR_REGEX = re.compile(r'^[0-9]+\.[0-9](\.[0-9])?esr$')

# Skeleton of the JSON document written to DATA_FILE.  "versions" is a
# placeholder that is replaced with the fetched version list when this module
# is run as a script.
useragents = {
    # fmt: off
    "versions": (),
    "os": ('Windows NT 10.0; Win64; x64',
           'X11; Linux x86_64'),
    "ua": "Mozilla/5.0 ({os}; rv:{version}) Gecko/20100101 Firefox/{version}",
    # fmt: on
}


def fetch_firefox_versions():
    """Return the Firefox release versions listed at :py:obj:`URL`.

    The release index page is downloaded and every link whose path lies below
    :py:obj:`RELEASE_PATH` is inspected; directory names that match
    :py:obj:`NORMAL_REGEX` are parsed with ``packaging.version.parse``.

    :returns: list of parsed versions, sorted from newest to oldest.
    :raises Exception: if the index page is not answered with HTTP 200.
    """
    resp = requests.get(URL, timeout=2.0)
    if resp.status_code != 200:
        # ``status_code`` is an int: it has to be formatted into the message,
        # concatenating it to a str would raise a TypeError instead.
        # pylint: disable=broad-exception-raised
        raise Exception(f"Error fetching firefox versions, HTTP code {resp.status_code}")

    dom = html.fromstring(resp.text)
    versions = []

    for link in dom.xpath('//a/@href'):
        # hrefs may be relative, resolve them against the index URL first
        url = urlparse(urljoin(URL, link))
        path = url.path
        if path.startswith(RELEASE_PATH):
            # strip the release prefix and the last character of the path
            # (the trailing slash of a directory link)
            version = path[len(RELEASE_PATH) : -1]
            if NORMAL_REGEX.match(version):
                versions.append(parse(version))

    versions.sort(reverse=True)
    return versions


def fetch_firefox_last_versions():
    """Return the ``major.minor`` strings of the two most recent major releases.

    Versions are taken from :py:func:`fetch_firefox_versions`; only those whose
    major number equals the newest major or the one before it are kept.  The
    result has no duplicates and keeps the newest-first order.

    :returns: list of ``'<major>.<minor>'`` strings.
    :raises IndexError: if :py:func:`fetch_firefox_versions` returns no version.
    """
    versions = fetch_firefox_versions()

    result = []
    major_last = versions[0].major
    major_list = (major_last, major_last - 1)
    for version in versions:
        major_current = version.major
        minor_current = version.minor
        if major_current in major_list:
            user_agent_version = f'{major_current}.{minor_current}'
            # patch releases collapse to the same major.minor, keep it once
            if user_agent_version not in result:
                result.append(user_agent_version)

    return result


if __name__ == '__main__':
    useragents["versions"] = fetch_firefox_last_versions()
    with DATA_FILE.open('w', encoding='utf-8') as f:
        json.dump(useragents, f, indent=4, sort_keys=True, ensure_ascii=False)