elasticsearch.py 4.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146
  1. # SPDX-License-Identifier: AGPL-3.0-or-later
  2. """
  3. Elasticsearch
  4. """
  5. from json import loads, dumps
  6. from requests.auth import HTTPBasicAuth
  7. from searx.exceptions import SearxEngineAPIException
  # --- Connection settings -------------------------------------------------
  # Root URL of the Elasticsearch HTTP endpoint.
  base_url = 'http://localhost:9200'
  # Credentials; request() only attaches HTTP basic auth when both are non-empty.
  username = ''
  password = ''
  # Name of the index to search; init() refuses to run while this is ''.
  index = ''
  # NOTE(review): this is evaluated once, from the values above at import
  # time. If the engine loader overrides base_url/index afterwards, this URL
  # is not recomputed -- verify against the loader.
  search_url = ''.join((base_url, '/', index, '/_search'))

  # --- Query behaviour -----------------------------------------------------
  # Key into _available_query_types selecting how the request body is built.
  query_type = 'match'
  # Query body template used by the 'custom' query type.
  custom_query_json = {}
  # When true, response() adds index/id/score of each hit under 'metadata'.
  show_metadata = False
  # Categories this engine is listed under (presumably read by the engine
  # loader; it is not used inside this module).
  categories = ['general']
  def init(engine_settings):
      """Validate the engine configuration.

      ``engine_settings`` is the mapping of settings for this engine. When it
      contains a ``query_type`` entry, that value must be one of the keys of
      ``_available_query_types``. Independently of that, the module-level
      ``index`` must not be the empty string.

      Raises ``ValueError`` when either check fails.
      """
      if 'query_type' in engine_settings:
          configured_type = engine_settings['query_type']
          if configured_type not in _available_query_types:
              raise ValueError('unsupported query type', configured_type)

      # Without an index name there is nothing to search.
      if index == '':
          raise ValueError('index cannot be empty')
  def request(query, params):
      """Fill ``params`` with the HTTP request for an Elasticsearch search.

      ``query`` is the user's search string and ``params`` the request
      description dict, which is modified in place and returned. If the
      module-level ``query_type`` is not a key of ``_available_query_types``,
      ``params`` is returned untouched.

      Otherwise the function sets ``url``, ``method``, ``data`` (the JSON
      encoded query body) and the ``Content-Type`` header, plus ``auth`` when
      both ``username`` and ``password`` are non-empty.
      """
      build_body = _available_query_types.get(query_type)
      if build_body is None:
          # Unknown query type: leave the request description as it is.
          return params

      if username and password:
          params['auth'] = HTTPBasicAuth(username, password)

      # NOTE(review): search_url is whatever the module-level variable holds;
      # confirm it reflects the configured base_url/index at this point.
      params['url'] = search_url
      # The search body is sent along with a GET request.
      params['method'] = 'GET'
      params['data'] = dumps(build_body(query))
      params['headers']['Content-Type'] = 'application/json'
      return params
  def _match_query(query):
      """Build the request body for an Elasticsearch ``match`` query.

      The standard for full text queries.
      searx format: "key:value" e.g. city:berlin

      Only the first ``:`` separates the field name from the text to match,
      so the value may itself contain colons (e.g. ``url:http://example.org``).

      REF: https://www.elastic.co/guide/en/elasticsearch/reference/current/query-dsl-match-query.html

      Returns a dict of the form
      ``{"query": {"match": {key: {"query": value}}}}``.
      Raises ``ValueError`` when ``query`` cannot be split into key and value.
      """
      try:
          # maxsplit=1: everything after the first colon belongs to the value.
          key, value = query.split(':', 1)
      except (AttributeError, TypeError, ValueError) as e:
          raise ValueError('query format must be "key:value"') from e
      return {"query": {"match": {key: {'query': value}}}}
  def _simple_query_string_query(query):
      """Build the request body for a ``simple_query_string`` query.

      Accepts query strings, but it is less strict than query_string.
      The whole ``query`` is passed through unchanged; the field used can be
      specified in index.query.default_field in Elasticsearch.

      REF: https://www.elastic.co/guide/en/elasticsearch/reference/current/query-dsl-simple-query-string-query.html
      """
      clause = {'query': query}
      body = {'query': {'simple_query_string': clause}}
      return body
  def _term_query(query):
      """Build the request body for an Elasticsearch ``term`` query.

      Accepts one term and the name of the field.
      searx format: "key:value" e.g. city:berlin

      Only the first ``:`` separates the field name from the term, so the
      term may itself contain colons (e.g. ``time:12:30``).

      REF: https://www.elastic.co/guide/en/elasticsearch/reference/current/query-dsl-term-query.html

      Returns a dict of the form ``{"query": {"term": {key: value}}}``.
      Raises ``ValueError`` when ``query`` cannot be split into key and value.
      """
      try:
          # maxsplit=1: everything after the first colon belongs to the term.
          key, value = query.split(':', 1)
      except (AttributeError, TypeError, ValueError) as e:
          raise ValueError('query format must be key:value') from e
      return {'query': {'term': {key: value}}}
  def _terms_query(query):
      """Build the request body for an Elasticsearch ``terms`` query.

      Accepts multiple terms and the name of the field.
      searx format: "key:value1,value2" e.g. city:berlin,paris

      Only the first ``:`` separates the field name from the comma separated
      list of terms, so individual terms may contain colons.

      REF: https://www.elastic.co/guide/en/elasticsearch/reference/current/query-dsl-terms-query.html

      Returns a dict of the form ``{"query": {"terms": {key: [value1, ...]}}}``.
      Raises ``ValueError`` when ``query`` cannot be split into key and values.
      """
      try:
          # maxsplit=1: everything after the first colon is the term list.
          key, values = query.split(':', 1)
      except (AttributeError, TypeError, ValueError) as e:
          raise ValueError('query format must be key:value1,value2') from e
      return {'query': {'terms': {key: values.split(',')}}}
  def _custom_query(query):
      """Build the request body from the administrator-defined query template.

      searx format: "key:value" e.g. city:berlin

      The module-level ``custom_query_json`` is used as a template: every dict
      key equal to ``{{KEY}}`` is replaced by the key part of ``query`` and
      every value equal to ``{{VALUE}}`` by the value part, at any nesting
      depth. Only the first ``:`` separates key and value.

      A new structure is returned on every call. The template itself is never
      modified, otherwise the placeholders would be gone after the first query.

      Raises ``ValueError`` when ``query`` cannot be split into key and value.
      """
      try:
          key, value = query.split(':', 1)
      except (AttributeError, TypeError, ValueError) as e:
          raise ValueError('query format must be key:value') from e
      return _fill_placeholders(custom_query_json, key, value)


  def _fill_placeholders(node, key, value):
      """Return a copy of ``node`` with ``{{KEY}}``/``{{VALUE}}`` substituted."""
      if isinstance(node, dict):
          return {
              (key if name == '{{KEY}}' else name): _fill_placeholders(child, key, value)
              for name, child in node.items()
          }
      if isinstance(node, list):
          return [_fill_placeholders(child, key, value) for child in node]
      if isinstance(node, str) and node == '{{VALUE}}':
          return value
      # Numbers, booleans, None and other strings are taken over unchanged.
      return node
  def response(resp):
      """Turn the Elasticsearch reply into a list of key-value results.

      ``resp.text`` is parsed as JSON. A reply containing an ``error`` entry
      raises ``SearxEngineAPIException`` with that entry as its argument.

      Each hit yields one dict built from the hit's ``_source``: values of
      fields whose name starts with ``_`` are kept as they are, all other
      values are converted with ``str``. Every result uses the
      ``key-value.html`` template and, when ``show_metadata`` is true, also
      carries the hit's index, id and score under ``metadata``.
      """
      payload = loads(resp.text)
      if 'error' in payload:
          raise SearxEngineAPIException(payload['error'])

      collected = []
      for hit in payload['hits']['hits']:
          entry = {}
          for field, raw in hit['_source'].items():
              # Underscore-prefixed fields keep their original type.
              entry[field] = raw if field.startswith('_') else str(raw)
          entry['template'] = 'key-value.html'

          if show_metadata:
              entry['metadata'] = {
                  'index': hit['_index'],
                  'id': hit['_id'],
                  'score': hit['_score'],
              }

          collected.append(entry)
      return collected
  # Maps each supported ``query_type`` setting to the function that builds the
  # request body for it. init() and request() check membership in this table.
  _available_query_types = {
      # -- Full text queries --
      # https://www.elastic.co/guide/en/elasticsearch/reference/current/full-text-queries.html
      'match': _match_query,
      'simple_query_string': _simple_query_string_query,

      # -- Term-level queries --
      # https://www.elastic.co/guide/en/elasticsearch/reference/current/term-level-queries.html
      'term': _term_query,
      'terms': _terms_query,

      # -- Query JSON defined by the instance administrator --
      'custom': _custom_query,
  }