123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171 |
- # SPDX-License-Identifier: AGPL-3.0-or-later
- # lint: pylint
- # pylint: disable=missing-module-docstring
- # pyright: basic
- import json
- import time
- import threading
- import os
- import signal
- from typing import Dict, Union, List, Any, Tuple, Optional
- from typing_extensions import TypedDict, Literal
- import redis.exceptions
- from searx import logger, settings, searx_debug
- from searx.redisdb import client as get_redis_client
- from searx.exceptions import SearxSettingsException
- from searx.search.processors import PROCESSORS
- from searx.search.checker import Checker
- from searx.search.checker.scheduler import scheduler_function
# Redis key under which the JSON-serialized checker result is stored.
REDIS_RESULT_KEY = 'SearXNG_checker_result'

# Redis key of the lock taken for the duration of a checker run.
REDIS_LOCK_KEY = 'SearXNG_checker_lock'

# Every shape a checker result can take; the ``status`` field tells them apart.
CheckerResult = Union[
    'CheckerOk',
    'CheckerErr',
    'CheckerOther',
]
class CheckerOk(TypedDict):
    """The checker ran to completion.

    Individual engines may still have failed; see ``engines`` for the
    per-engine outcome.
    """

    # discriminator of the CheckerResult union
    status: Literal['ok']
    # outcome of each engine, keyed by engine name
    engines: Dict[str, 'EngineResult']
    # time of the run, rounded down to the full hour (Unix seconds)
    timestamp: int
class CheckerErr(TypedDict):
    """The checker run itself failed (no per-engine results are available)."""

    # discriminator of the CheckerResult union
    status: Literal['error']
    # time of the failed run, rounded down to the full hour (Unix seconds)
    timestamp: int
class CheckerOther(TypedDict):
    """No result is available: nothing is stored yet, or the checker is disabled."""

    # 'disabled': no Redis client; 'unknown': the result key does not exist
    status: Literal['unknown', 'disabled']
# Outcome of checking a single engine; the ``success`` flag tells the variants apart.
EngineResult = Union[
    'EngineOk',
    'EngineErr',
]
class EngineOk(TypedDict):
    """The engine passed all of its checks."""

    # always True for this variant
    success: Literal[True]
class EngineErr(TypedDict):
    """The engine failed at least one of its checks."""

    # always False for this variant
    success: Literal[False]
    # error messages reported by the Checker, grouped under string keys
    # (presumably the test name -- confirm against Checker.test_results)
    errors: Dict[str, List[str]]
def _get_interval(every: Any, error_msg: str) -> Tuple[int, int]:
    """Normalize a scheduling setting into a two-element integer range.

    :param every: value read from the settings; either a single ``int`` or a
        ``list`` / ``tuple`` of exactly two ``int``.
    :param error_msg: message of the exception raised for an invalid value.
    :returns: ``(every, every)`` for a single integer, otherwise
        ``(every[0], every[1])``.
    :raises SearxSettingsException: if ``every`` has any other shape or type.
    """

    def _is_plain_int(value: Any) -> bool:
        # bool is a subclass of int: without this exclusion a setting such as
        # ``every: true`` would silently be accepted as a 1 second interval.
        return isinstance(value, int) and not isinstance(value, bool)

    if _is_plain_int(every):
        return (every, every)
    if isinstance(every, (tuple, list)) and len(every) == 2 and all(_is_plain_int(item) for item in every):
        return (every[0], every[1])
    raise SearxSettingsException(error_msg, None)
def get_result() -> CheckerResult:
    """Return the checker result currently stored in Redis.

    :returns: ``{'status': 'disabled'}`` when there is no Redis client,
        ``{'status': 'unknown'}`` when the result key does not exist,
        otherwise the JSON-decoded stored value.
    """
    redis_client = get_redis_client()
    if redis_client is None:
        # no Redis means the checker is disabled
        return {'status': 'disabled'}

    payload: Optional[bytes] = redis_client.get(REDIS_RESULT_KEY)
    # a missing key means nothing has been stored under REDIS_RESULT_KEY
    return {'status': 'unknown'} if payload is None else json.loads(payload)
def _set_result(result: CheckerResult):
    """Store ``result`` in Redis as JSON; do nothing when Redis is unavailable.

    :param result: the checker result to serialize under ``REDIS_RESULT_KEY``.
    """
    redis_client = get_redis_client()
    if redis_client is not None:
        serialized = json.dumps(result)
        redis_client.set(REDIS_RESULT_KEY, serialized)
def _timestamp():
    """Return the current Unix time in seconds, rounded down to the full hour."""
    seconds_per_hour = 3600
    whole_hours = int(time.time() / seconds_per_hour)
    return whole_hours * seconds_per_hour
def run():
    """Check every registered engine once and store the outcome in Redis.

    The whole run is guarded by a Redis lock so that two checker runs never
    overlap.  On success a ``CheckerOk`` result (with one entry per engine) is
    stored; on any failure -- including not getting the lock -- a
    ``CheckerErr`` result is stored instead.  Nothing is raised to the caller
    unless storing the error result itself fails.
    """
    try:
        client = get_redis_client()
        if client is None:
            # Without Redis there is neither a lock nor a place to store the
            # result; report it plainly instead of failing on ``None.lock``.
            logger.error('The checker requires Redis')
            return

        # use a Redis lock to make sure there is no checker running at the same time
        # (this should not happen, this is a safety measure)
        # blocking_timeout: give up acquiring after 60 s (raises LockError);
        # timeout: the lock expires by itself after one hour.
        with client.lock(REDIS_LOCK_KEY, blocking_timeout=60, timeout=3600):
            logger.info('Starting checker')
            result: CheckerOk = {'status': 'ok', 'engines': {}, 'timestamp': _timestamp()}
            for name, processor in PROCESSORS.items():
                logger.debug('Checking %s engine', name)
                checker = Checker(processor)
                checker.run()
                if checker.test_results.successful:
                    result['engines'][name] = {'success': True}
                else:
                    result['engines'][name] = {'success': False, 'errors': checker.test_results.errors}

            _set_result(result)
            logger.info('Check done')
    except Exception:  # pylint: disable=broad-except
        # redis.exceptions.LockError is an Exception subclass, so this single
        # handler also covers a lock that could not be acquired or released.
        # Log before touching Redis again: if storing the error result fails
        # as well, the original traceback has already been recorded.
        logger.exception('Error while running the checker')
        _set_result({'status': 'error', 'timestamp': _timestamp()})
def _signal_handler(_signum: int, _frame: Any):
    """Signal callback: start one checker run in a background daemon thread.

    Both arguments are supplied by the ``signal`` module and are ignored.
    """
    worker = threading.Thread(target=run, daemon=True)
    worker.start()
def initialize():
    """Install the SIGUSR1 trigger and start the background checker scheduler.

    The signal handler is registered whenever the platform has SIGUSR1.  The
    scheduler thread is only started when all of the following hold: the
    checker is not switched off by debug mode, ``checker.scheduling`` is set,
    and a Redis client is available.

    :raises SearxSettingsException: if ``checker.scheduling.every`` or
        ``checker.scheduling.start_after`` is neither an int nor a pair of ints.
    """
    sigusr1 = getattr(signal, 'SIGUSR1', None)
    if sigusr1 is not None:
        # Windows doesn't support SIGUSR1
        logger.info('Send SIGUSR1 signal to pid %i to start the checker', os.getpid())
        signal.signal(sigusr1, _signal_handler)

    # special case when debug mode is active
    if searx_debug and settings['checker']['off_when_debug']:
        logger.info('debug mode: checker is disabled')
        return

    # a missing or empty checker.scheduling section disables the scheduler
    scheduling = settings['checker']['scheduling']
    if not scheduling:
        logger.info('Checker scheduler is disabled')
        return

    # make sure there is a Redis connection
    if get_redis_client() is None:
        logger.error('The checker requires Redis')
        return

    # validate both ranges (``every`` first) before starting the scheduler
    every_min, every_max = _get_interval(
        scheduling.get('every', (300, 1800)),
        'checker.scheduling.every is not a int or list',
    )
    start_min, start_max = _get_interval(
        scheduling.get('start_after', (300, 1800)),
        'checker.scheduling.start_after is not a int or list',
    )

    # start the background scheduler
    scheduler_thread = threading.Thread(
        target=scheduler_function,
        args=(start_min, start_max, every_min, every_max, run),
        name='checker_scheduler',
        daemon=True,
    )
    scheduler_thread.start()
|