| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178 | 
							- # SPDX-License-Identifier: AGPL-3.0-or-later
 
- """.. sidebar:: info
 
-    - :origin:`elasticsearch.py <searx/engines/elasticsearch.py>`
 
-    - `Elasticsearch <https://www.elastic.co/elasticsearch/>`_
 
-    - `Elasticsearch Guide
 
-      <https://www.elastic.co/guide/en/elasticsearch/reference/current/index.html>`_
 
-    - `Install Elasticsearch
 
-      <https://www.elastic.co/guide/en/elasticsearch/reference/current/install-elasticsearch.html>`_
 
- Elasticsearch_ supports numerous ways to query the data it is storing.  At the
 
- moment the engine supports the most popular search methods (``query_type``):
 
- - ``match``,
 
- - ``simple_query_string``,
 
- - ``term`` and
 
- - ``terms``.
 
- If none of the methods fit your use case, you can select the ``custom`` query type
 
- and provide the JSON payload to submit to Elasticsearch in
 
- ``custom_query_json``.
 
- Example
 
- =======
 
- The following is an example configuration for an Elasticsearch_ instance with
 
- authentication configured to read from the ``my-index`` index.
 
- .. code:: yaml
 
-   - name: elasticsearch
 
-     shortcut: es
 
-     engine: elasticsearch
 
-     base_url: http://localhost:9200
 
-     username: elastic
 
-     password: changeme
 
-     index: my-index
 
-     query_type: match
 
-     # custom_query_json: '{ ... }'
 
-     enable_http: true
 
- """
 
- from json import loads, dumps
 
- from searx.exceptions import SearxEngineAPIException
 
# Root URL of the Elasticsearch HTTP API.
base_url = 'http://localhost:9200'

# Credentials; request() only sends them when both are non-empty.
username = ''
password = ''

# Name of the index to search; init() rejects an empty value.
index = ''

# NOTE: evaluated once, when this module is imported, from the values above.
search_url = f'{base_url}/{index}/_search'

# Key into _available_query_types selecting how the user query is translated.
query_type = 'match'

# Payload template used by the ``custom`` query type.
custom_query_json = {}

# When true, response() attaches index / id / score to every result.
show_metadata = False

categories = ['general']
 
def init(engine_settings):
    """Validate the engine configuration.

    :param engine_settings: mapping of the settings configured for this
        engine; only its ``query_type`` entry is inspected here.
    :raises ValueError: if a ``query_type`` is configured that is not a key of
        ``_available_query_types``, or if the module-level ``index`` is the
        empty string.
    """
    if 'query_type' in engine_settings:
        requested_type = engine_settings['query_type']
        if requested_type not in _available_query_types:
            raise ValueError('unsupported query type', requested_type)

    if index == '':
        raise ValueError('index cannot be empty')
 
def request(query, params):
    """Fill ``params`` with the HTTP request that runs ``query``.

    The query is translated by the function registered for the module-level
    ``query_type`` in ``_available_query_types`` and sent as a JSON body.

    :param query: the search query string entered by the user.
    :param params: request parameter dict; must already contain a ``headers``
        dict.  It is updated in place.
    :returns: the same ``params`` object.  It is returned untouched when
        ``query_type`` is not a known query type.
    :raises ValueError: propagated from the query builder when ``query`` does
        not have the format that builder expects.
    """
    if query_type not in _available_query_types:
        return params

    # Basic auth is only attached when both parts are configured.
    if username and password:
        params['auth'] = (username, password)

    # Build the URL from the *current* ``base_url`` / ``index``.  The
    # module-level ``search_url`` is computed once at import time, when
    # ``index`` is still empty, so it never reflects the configured values.
    # A trailing slash on ``base_url`` is tolerated.
    params['url'] = base_url.rstrip('/') + '/' + index + '/_search'
    params['method'] = 'GET'
    params['data'] = dumps(_available_query_types[query_type](query))
    params['headers']['Content-Type'] = 'application/json'

    return params
 
def _match_query(query):
    """Build a ``match`` query, the standard for full text queries.

    searx format: "key:value" e.g. city:berlin

    Only the first colon separates field name and value, so the value may
    itself contain colons (e.g. ``url:http://example.org``).

    REF: https://www.elastic.co/guide/en/elasticsearch/reference/current/query-dsl-match-query.html

    :param query: query string in ``key:value`` form.
    :returns: dict holding the Elasticsearch request body.
    :raises ValueError: if ``query`` contains no colon.
    """
    try:
        key, value = query.split(':', 1)
    except ValueError as e:
        raise ValueError('query format must be "key:value"') from e

    return {"query": {"match": {key: {'query': value}}}}
 
def _simple_query_string_query(query):
    """Wrap ``query`` in a ``simple_query_string`` request body.

    This query type accepts query strings but is less strict than
    ``query_string``.  The field used can be specified in
    ``index.query.default_field`` in Elasticsearch.

    REF: https://www.elastic.co/guide/en/elasticsearch/reference/current/query-dsl-simple-query-string-query.html

    :param query: the query string, passed through unchanged.
    :returns: dict holding the Elasticsearch request body.
    """
    clause = {'query': query}
    return {'query': {'simple_query_string': clause}}
 
def _term_query(query):
    """Build a ``term`` query from one term and the name of the field.

    searx format: "key:value" e.g. city:berlin

    Only the first colon separates field name and value, so the term may
    itself contain colons.

    REF: https://www.elastic.co/guide/en/elasticsearch/reference/current/query-dsl-term-query.html

    :param query: query string in ``key:value`` form.
    :returns: dict holding the Elasticsearch request body.
    :raises ValueError: if ``query`` contains no colon.
    """
    try:
        key, value = query.split(':', 1)
    except ValueError as e:
        raise ValueError('query format must be key:value') from e

    return {'query': {'term': {key: value}}}
 
def _terms_query(query):
    """Build a ``terms`` query from multiple terms and the name of the field.

    searx format: "key:value1,value2" e.g. city:berlin,paris

    Only the first colon separates the field name from the comma separated
    list of terms, so individual terms may contain colons.

    REF: https://www.elastic.co/guide/en/elasticsearch/reference/current/query-dsl-terms-query.html

    :param query: query string in ``key:value1,value2`` form.
    :returns: dict holding the Elasticsearch request body.
    :raises ValueError: if ``query`` contains no colon.
    """
    try:
        key, values = query.split(':', 1)
    except ValueError as e:
        raise ValueError('query format must be key:value1,value2') from e

    return {'query': {'terms': {key: values.split(',')}}}
 
def _custom_query(query):
    """Build the request body from the administrator-defined template.

    searx format: "key:value" e.g. city:berlin

    The module-level ``custom_query_json`` is used as a template: every dict
    key equal to ``{{KEY}}`` is replaced by the key of the query and every
    value equal to ``{{VALUE}}`` by its value, at any nesting depth.  The
    template itself is never modified, so it can be reused for every request.

    :param query: query string in ``key:value`` form; only the first colon
        separates key and value.
    :returns: a new object holding the Elasticsearch request body.
    :raises ValueError: if ``query`` contains no colon, or if
        ``custom_query_json`` is a string that is not valid JSON.
    """
    try:
        key, value = query.split(':', 1)
    except ValueError as e:
        raise ValueError('query format must be key:value') from e

    template = custom_query_json
    # The template may be configured as a JSON string instead of a mapping.
    if isinstance(template, str):
        template = loads(template)

    return _fill_placeholders(template, key, value)


def _fill_placeholders(node, key, value):
    """Return a copy of ``node`` with ``{{KEY}}`` / ``{{VALUE}}`` substituted."""
    if isinstance(node, dict):
        return {
            (key if name == '{{KEY}}' else name): _fill_placeholders(child, key, value)
            for name, child in node.items()
        }
    if isinstance(node, list):
        return [_fill_placeholders(child, key, value) for child in node]
    if node == '{{VALUE}}':
        return value
    return node
 
def response(resp):
    """Convert an Elasticsearch search response into a list of results.

    Each hit becomes one result dict built from its ``_source``: values are
    converted to ``str`` unless the field name starts with an underscore, and
    the ``key-value.html`` template is selected.  When the module-level
    ``show_metadata`` is true, the hit's index, id and score are attached
    under ``metadata``.

    :param resp: response object whose ``text`` attribute holds the JSON body.
    :returns: list of result dicts, one per hit.
    :raises SearxEngineAPIException: if the body contains an ``error`` entry.
    """
    payload = loads(resp.text)
    if 'error' in payload:
        raise SearxEngineAPIException(payload['error'])

    results = []
    for hit in payload['hits']['hits']:
        entry = {}
        for field, content in hit['_source'].items():
            # Underscore-prefixed fields keep their original type.
            entry[field] = content if field.startswith('_') else str(content)
        entry['template'] = 'key-value.html'

        if show_metadata:
            entry['metadata'] = {
                'index': hit['_index'],
                'id': hit['_id'],
                'score': hit['_score'],
            }

        results.append(entry)

    return results
 
# Dispatch table: maps each supported ``query_type`` setting to the function
# that turns the user's query string into an Elasticsearch request body.
_available_query_types = {
    # -- Full text queries
    #    https://www.elastic.co/guide/en/elasticsearch/reference/current/full-text-queries.html
    'match': _match_query,
    'simple_query_string': _simple_query_string_query,
    # -- Term-level queries
    #    https://www.elastic.co/guide/en/elasticsearch/reference/current/term-level-queries.html
    'term': _term_query,
    'terms': _terms_query,
    # -- Query JSON defined by the instance administrator
    'custom': _custom_query,
}
 
 
  |