.oO SearXNG Developer Documentation Oo.
Loading...
Searching...
No Matches
elasticsearch.py
Go to the documentation of this file.
1# SPDX-License-Identifier: AGPL-3.0-or-later
2""".. sidebar:: info
3
4 - :origin:`elasticsearch.py <searx/engines/elasticsearch.py>`
5 - `Elasticsearch <https://www.elastic.co/elasticsearch/>`_
6 - `Elasticsearch Guide
7 <https://www.elastic.co/guide/en/elasticsearch/reference/current/index.html>`_
8 - `Install Elasticsearch
9 <https://www.elastic.co/guide/en/elasticsearch/reference/current/install-elasticsearch.html>`_
10
11Elasticsearch_ supports numerous ways to query the data it is storing. At the
12moment the engine supports the most popular search methods (``query_type``):
13
14- ``match``,
15- ``simple_query_string``,
16- ``term`` and
17- ``terms``.
18
19If none of the methods fit your use case, you can select ``custom`` query type
20and provide the JSON payload to submit to Elasticsearch in
21``custom_query_json``.
22
23Example
24=======
25
26The following is an example configuration for an Elasticsearch_ instance with
27authentication configured to read from ``my-index`` index.
28
29.. code:: yaml
30
31 - name: elasticsearch
32 shortcut: els
33 engine: elasticsearch
34 base_url: http://localhost:9200
35 username: elastic
36 password: changeme
37 index: my-index
38 query_type: match
39 # custom_query_json: '{ ... }'
40 enable_http: true
41
42"""
43
44from json import loads, dumps
45from searx.exceptions import SearxEngineAPIException
46from searx.result_types import EngineResults
47from searx.extended_types import SXNG_Response
48
# Engine registration: result category and paging support.
categories = ['general']
paging = True

# Descriptive metadata about the upstream service.
about = {
    'website': 'https://www.elastic.co',
    'wikidata_id': 'Q3050461',
    'official_api_documentation': 'https://www.elastic.co/guide/en/elasticsearch/reference/current/search-search.html',
    'use_official_api': True,
    'require_api_key': False,
    'format': 'JSON',
}

# Default engine options (the module docstring shows an example of setting
# them in the YAML engine configuration).
base_url = 'http://localhost:9200'
username = ''
password = ''
index = ''
query_type = 'match'
custom_query_json = {}
show_metadata = False
page_size = 10
69
70
def init(engine_settings):
    """Validate the engine configuration.

    :param engine_settings: mapping of engine settings; only the
        ``query_type`` entry is inspected here.
    :raises ValueError: if a ``query_type`` is configured that is not a key of
        ``_available_query_types``, or if the module-level ``index`` is the
        empty string.
    """
    if 'query_type' in engine_settings:
        configured_type = engine_settings['query_type']
        if configured_type not in _available_query_types:
            raise ValueError('unsupported query type', configured_type)

    if index == '':
        raise ValueError('index cannot be empty')
77
78
def request(query, params):
    """Fill ``params`` with the Elasticsearch ``_search`` request for ``query``.

    :param query: the user's search string, handed to the builder registered
        for the configured ``query_type``.
    :param params: request parameters; ``pageno`` and ``headers`` are read,
        ``auth`` (optional), ``url``, ``method`` and ``data`` are written.
    :returns: the same ``params`` mapping.  It is returned untouched when
        ``query_type`` is not a key of ``_available_query_types``.
    """
    if query_type not in _available_query_types:
        return params

    # Credentials are only attached when both parts are non-empty.
    if username and password:
        params['auth'] = (username, password)

    # Paging: the offset of the first hit for the requested page.
    offset = (params['pageno'] - 1) * page_size

    build_body = _available_query_types[query_type]
    body = build_body(query)
    body['from'] = offset
    body['size'] = page_size

    # The query is sent as a JSON body of a GET request.
    params['url'] = f"{base_url}/{index}/_search"
    params['method'] = 'GET'
    params['data'] = dumps(body)
    params['headers']['Content-Type'] = 'application/json'

    return params
99
100
101def _match_query(query):
102 """
103 The standard for full text queries.
104 searx format: "key:value" e.g. city:berlin
105 REF: https://www.elastic.co/guide/en/elasticsearch/reference/current/query-dsl-match-query.html
106 """
107
108 try:
109 key, value = query.split(':')
110 except Exception as e:
111 raise ValueError('query format must be "key:value"') from e
112
113 return {"query": {"match": {key: {'query': value}}}}
114
115
117 """
118 Accepts query strings, but it is less strict than query_string
119 The field used can be specified in index.query.default_field in Elasticsearch.
120 REF: https://www.elastic.co/guide/en/elasticsearch/reference/current/query-dsl-simple-query-string-query.html
121 """
122
123 return {'query': {'simple_query_string': {'query': query}}}
124
125
126def _term_query(query):
127 """
128 Accepts one term and the name of the field.
129 searx format: "key:value" e.g. city:berlin
130 REF: https://www.elastic.co/guide/en/elasticsearch/reference/current/query-dsl-term-query.html
131 """
132
133 try:
134 key, value = query.split(':')
135 except Exception as e:
136 raise ValueError('query format must be key:value') from e
137
138 return {'query': {'term': {key: value}}}
139
140
141def _terms_query(query):
142 """
143 Accepts multiple terms and the name of the field.
144 searx format: "key:value1,value2" e.g. city:berlin,paris
145 REF: https://www.elastic.co/guide/en/elasticsearch/reference/current/query-dsl-terms-query.html
146 """
147
148 try:
149 key, values = query.split(':')
150 except Exception as e:
151 raise ValueError('query format must be key:value1,value2') from e
152
153 return {'query': {'terms': {key: values.split(',')}}}
154
155
156def _custom_query(query):
157 key, value = query.split(':')
158 custom_query = custom_query_json
159 for query_key, query_value in custom_query.items():
160 if query_key == '{{KEY}}':
161 custom_query[key] = custom_query.pop(query_key)
162 if query_value == '{{VALUE}}':
163 custom_query[query_key] = value
164 return custom_query
165
166
def response(resp: SXNG_Response) -> EngineResults:
    """Convert the Elasticsearch answer into key/value results.

    :param resp: response whose ``text`` holds the JSON document returned by
        the ``_search`` request.
    :returns: an ``EngineResults`` with one ``KeyValue`` entry per hit.
    :raises SearxEngineAPIException: if the JSON document has an ``error`` key.
    """
    results = EngineResults()

    payload = loads(resp.text)
    if 'error' in payload:
        raise SearxEngineAPIException(payload["error"])

    for hit in payload["hits"]["hits"]:
        kvmap = {}
        for field, content in hit["_source"].items():
            # fields starting with an underscore keep their original value,
            # all other values are shown as strings
            kvmap[field] = content if field.startswith("_") else str(content)

        if show_metadata:
            kvmap["metadata"] = {"index": hit["_index"], "id": hit["_id"], "score": hit["_score"]}

        results.add(results.types.KeyValue(kvmap=kvmap))

    return results
181
182
# Maps each supported ``query_type`` value to the function that builds the
# request body for it.
_available_query_types = {
    # Full text queries
    # https://www.elastic.co/guide/en/elasticsearch/reference/current/full-text-queries.html
    'match': _match_query,
    'simple_query_string': _simple_query_string_query,
    # Term-level queries
    # https://www.elastic.co/guide/en/elasticsearch/reference/current/term-level-queries.html
    'term': _term_query,
    'terms': _terms_query,
    # Query JSON defined by the instance administrator.
    'custom': _custom_query,
}
EngineResults response(SXNG_Response resp)