# SPDX-License-Identifier: AGPL-3.0-or-later
# lint: pylint
# pylint: disable=missing-module-docstring
# pyright: basic

import json
import time
import threading
import os
import signal
from typing import Dict, Union, List, Any, Tuple, Optional
from typing_extensions import TypedDict, Literal

import redis.exceptions

from searx import logger, settings, searx_debug
from searx.shared.redisdb import client as get_redis_client
from searx.exceptions import SearxSettingsException
from searx.search.processors import PROCESSORS
from searx.search.checker import Checker
from searx.search.checker.scheduler import scheduler_function

# Redis key under which the JSON-serialized checker result is stored
REDIS_RESULT_KEY = 'SearXNG_checker_result'
# Redis lock name used to prevent two checker runs at the same time
REDIS_LOCK_KEY = 'SearXNG_checker_lock'


CheckerResult = Union['CheckerOk', 'CheckerErr', 'CheckerOther']


class CheckerOk(TypedDict):
    """Checking the engines succeeded"""

    status: Literal['ok']
    # per-engine outcome, keyed by the name used in PROCESSORS
    engines: Dict[str, 'EngineResult']
    # value of _timestamp() when the run started
    timestamp: int


class CheckerErr(TypedDict):
    """Checking the engines failed"""

    status: Literal['error']
    # value of _timestamp() when the failure was recorded
    timestamp: int


class CheckerOther(TypedDict):
    """The status is unknown or disabled"""

    status: Literal['unknown', 'disabled']


EngineResult = Union['EngineOk', 'EngineErr']


class EngineOk(TypedDict):
    """Checking the engine succeeded"""

    success: Literal[True]


class EngineErr(TypedDict):
    """Checking the engine failed"""

    success: Literal[False]
    # copied from ``checker.test_results.errors``
    errors: Dict[str, List[str]]


def _get_interval(every: Any, error_msg: str) -> Tuple[int, int]:
    """Normalize a scheduling setting to a ``(first, second)`` tuple of ints.

    :param every: either a single ``int`` (returned as ``(every, every)``) or
        a two-item tuple / list of ``int``.
    :param error_msg: message of the exception raised for any other value.
    :raises SearxSettingsException: when ``every`` has neither of the
        accepted shapes.
    """
    if isinstance(every, int):
        return (every, every)

    if (
        not isinstance(every, (tuple, list))
        or len(every) != 2  # type: ignore
        or not isinstance(every[0], int)
        or not isinstance(every[1], int)
    ):
        raise SearxSettingsException(error_msg, None)
    return (every[0], every[1])


def get_result() -> CheckerResult:
    """Return the last checker result stored in Redis.

    Returns ``{'status': 'disabled'}`` when there is no Redis client,
    ``{'status': 'unknown'}`` when ``REDIS_RESULT_KEY`` does not exist, and
    otherwise the JSON-decoded value of that key.
    """
    client = get_redis_client()
    if client is None:
        # without Redis, the checker is disabled
        return {'status': 'disabled'}
    serialized_result: Optional[bytes] = client.get(REDIS_RESULT_KEY)
    if serialized_result is None:
        # the Redis key does not exist
        return {'status': 'unknown'}
    return json.loads(serialized_result)


def _set_result(result: CheckerResult):
    """Store ``result`` as JSON under ``REDIS_RESULT_KEY``.

    Does nothing when there is no Redis client.
    """
    client = get_redis_client()
    if client is None:
        # without Redis, the function does nothing
        return
    client.set(REDIS_RESULT_KEY, json.dumps(result))


def _timestamp():
    """Return the current Unix time rounded down to a multiple of 3600 seconds."""
    return int(time.time() / 3600) * 3600


def _record_failure():
    """Log the exception currently being handled and store an ``'error'`` result.

    Must be called from inside an ``except`` block.  The traceback is logged
    before Redis is touched, so it is not lost if storing the result fails too.
    """
    logger.exception('Error while running the checker')
    _set_result({'status': 'error', 'timestamp': _timestamp()})


def run():
    """Run the checker on every processor of ``PROCESSORS`` and store the result.

    On success a ``CheckerOk`` result is stored in Redis; if anything raises,
    the exception is logged and a ``CheckerErr`` result is stored instead.
    When there is no Redis client, an error is logged and nothing is checked.
    """
    try:
        client = get_redis_client()
        if client is None:
            # run() can be triggered by SIGUSR1 even when Redis is not
            # configured: report it explicitly instead of failing with an
            # AttributeError on ``None.lock``
            logger.error('The checker requires Redis')
            return

        # use a Redis lock to make sure there is no checker running at the same time
        # (this should not happen, this is a safety measure)
        with client.lock(REDIS_LOCK_KEY, blocking_timeout=60, timeout=3600):
            logger.info('Starting checker')
            result: CheckerOk = {'status': 'ok', 'engines': {}, 'timestamp': _timestamp()}
            for name, processor in PROCESSORS.items():
                logger.debug('Checking %s engine', name)
                checker = Checker(processor)
                checker.run()
                if checker.test_results.successful:
                    result['engines'][name] = {'success': True}
                else:
                    result['engines'][name] = {'success': False, 'errors': checker.test_results.errors}

            _set_result(result)
            logger.info('Check done')
    except redis.exceptions.LockError:
        # problem with the Redis lock itself (see the redis-py Lock documentation)
        _record_failure()
    except Exception:  # pylint: disable=broad-except
        _record_failure()


def _signal_handler(_signum: int, _frame: Any):
    """Signal handler: start :py:func:`run` in a daemon thread and return."""
    t = threading.Thread(target=run)
    t.daemon = True
    t.start()


def initialize():
    """Install the SIGUSR1 handler and start the background scheduler thread.

    The signal handler is installed whenever the platform has ``SIGUSR1``.
    The scheduler thread is started only if the checker is not switched off
    by debug mode, ``checker.scheduling`` is set, and a Redis client is
    available.

    :raises SearxSettingsException: when ``checker.scheduling.every`` or
        ``checker.scheduling.start_after`` is neither an int nor a pair of ints.
    """
    if hasattr(signal, 'SIGUSR1'):
        # Windows doesn't support SIGUSR1
        logger.info('Send SIGUSR1 signal to pid %i to start the checker', os.getpid())
        signal.signal(signal.SIGUSR1, _signal_handler)

    # special case when debug is activated
    if searx_debug and settings['checker']['off_when_debug']:
        logger.info('debug mode: checker is disabled')
        return

    # check value of checker.scheduling.every now
    scheduling = settings['checker']['scheduling']
    if not scheduling:
        # covers None as well as any other empty / false value
        logger.info('Checker scheduler is disabled')
        return

    # make sure there is a Redis connection
    if get_redis_client() is None:
        logger.error('The checker requires Redis')
        return

    # start the background scheduler
    every_range = _get_interval(scheduling.get('every', (300, 1800)), 'checker.scheduling.every is not a int or list')
    start_after_range = _get_interval(
        scheduling.get('start_after', (300, 1800)), 'checker.scheduling.start_after is not a int or list'
    )
    t = threading.Thread(
        target=scheduler_function,
        args=(start_after_range[0], start_after_range[1], every_range[0], every_range[1], run),
        name='checker_scheduler',
    )
    t.daemon = True
    t.start()