.oO SearXNG Developer Documentation Oo.
Loading...
Searching...
No Matches
unit_converter.py
Go to the documentation of this file.
1# SPDX-License-Identifier: AGPL-3.0-or-later
2"""A plugin for converting measured values from one unit to another unit (a
3unit converter).
4
5The plugin looks up the symbols (given in the query term) in a list of
6converters, each converter is one item in the list (compare
7:py:obj:`ADDITIONAL_UNITS`). If the symbols are ambiguous, the matching units
8of measurement are evaluated. The weighting in the evaluation results from the
9sorting of the :py:obj:`list of unit converters<symbol_to_si>`.
10"""
11from __future__ import annotations
12import typing
13import re
14import babel.numbers
15
16from flask_babel import gettext, get_locale
17
18from searx import data
19from searx.plugins import Plugin, PluginInfo
20from searx.result_types import EngineResults
21
22if typing.TYPE_CHECKING:
23 from searx.search import SearchWithPlugins
24 from searx.extended_types import SXNG_Request
25 from searx.plugins import PluginCfg
26
27
28name = ""
29description = gettext("")
30
31plugin_id = ""
32preference_section = ""
33
34CONVERT_KEYWORDS = ["in", "to", "as"]
35
36
38 """Convert between units. The result is displayed in area for the
39 "answers".
40 """
41
42 id = "unit_converter"
43
44 def __init__(self, plg_cfg: "PluginCfg") -> None:
45 super().__init__(plg_cfg)
46
48 id=self.id,
49 name=gettext("Unit converter plugin"),
50 description=gettext("Convert between units"),
51 preference_section="general",
52 )
53
54 def post_search(self, request: "SXNG_Request", search: "SearchWithPlugins") -> EngineResults:
55 results = EngineResults()
56
57 # only convert between units on the first page
58 if search.search_query.pageno > 1:
59 return results
60
61 query = search.search_query.query
62 query_parts = query.split(" ")
63
64 if len(query_parts) < 3:
65 return results
66
67 for query_part in query_parts:
68 for keyword in CONVERT_KEYWORDS:
69 if query_part == keyword:
70 from_query, to_query = query.split(keyword, 1)
71 target_val = _parse_text_and_convert(from_query.strip(), to_query.strip())
72 if target_val:
73 results.add(results.types.Answer(answer=target_val))
74
75 return results
76
77
78# inspired from https://stackoverflow.com/a/42475086
79RE_MEASURE = r'''
80(?P<sign>[-+]?) # +/- or nothing for positive
81(\s*) # separator: white space or nothing
82(?P<number>[\d\.,]*) # number: 1,000.00 (en) or 1.000,00 (de)
83(?P<E>[eE][-+]?\d+)? # scientific notation: e(+/-)2 (*10^2)
84(\s*) # separator: white space or nothing
85(?P<unit>\S+) # unit of measure
86'''
87
88
89ADDITIONAL_UNITS = [
90 {
91 "si_name": "Q11579",
92 "symbol": "°C",
93 "to_si": lambda val: val + 273.15,
94 "from_si": lambda val: val - 273.15,
95 },
96 {
97 "si_name": "Q11579",
98 "symbol": "°F",
99 "to_si": lambda val: (val + 459.67) * 5 / 9,
100 "from_si": lambda val: (val * 9 / 5) - 459.67,
101 },
102]
103"""Additional items to convert from a measure unit to a SI unit (vice versa).
104
105.. code:: python
106
107 {
108 "si_name": "Q11579", # Wikidata item ID of the SI unit (Kelvin)
109 "symbol": "°C", # symbol of the measure unit
110 "to_si": lambda val: val + 273.15, # convert measure value (val) to SI unit
111 "from_si": lambda val: val - 273.15, # convert SI value (val) measure unit
112 },
113 {
114 "si_name": "Q11573",
115 "symbol": "mi",
116 "to_si": 1609.344, # convert measure value (val) to SI unit
117 "from_si": 1 / 1609.344 # convert SI value (val) measure unit
118 },
119
120The values of ``to_si`` and ``from_si`` can be of :py:obj:`float` (a multiplier)
121or a callable_ (val in / converted value returned).
122
123.. _callable: https://docs.python.org/3/glossary.html#term-callable
124"""
125
126
127ALIAS_SYMBOLS = {
128 '°C': ('C',),
129 '°F': ('F',),
130 'mi': ('L',),
131}
132"""Alias symbols for known unit of measure symbols / by example::
133
134 '°C': ('C', ...), # list of alias symbols for °C (Q69362731)
135 '°F': ('F', ...), # list of alias symbols for °F (Q99490479)
136 'mi': ('L',), # list of alias symbols for mi (Q253276)
137"""
138
139
140SYMBOL_TO_SI = []
141
142
144 """Generates a list of tuples, each tuple is a measure unit and the fields
145 in the tuple are:
146
147 0. Symbol of the measure unit (e.g. 'mi' for measure unit 'miles' Q253276)
148
149 1. SI name of the measure unit (e.g. Q11573 for SI unit 'metre')
150
151 2. Factor to get SI value from measure unit (e.g. 1mi is equal to SI 1m
152 multiplied by 1609.344)
153
154 3. Factor to get measure value from from SI value (e.g. SI 100m is equal to
155 100mi divided by 1609.344)
156
157 The returned list is sorted, the first items are created from
158 ``WIKIDATA_UNITS``, the second group of items is build from
159 :py:obj:`ADDITIONAL_UNITS` and items created from :py:obj:`ALIAS_SYMBOLS`.
160
161 If you search this list for a symbol, then a match with a symbol from
162 Wikidata has the highest weighting (first hit in the list), followed by the
163 symbols from the :py:obj:`ADDITIONAL_UNITS` and the lowest weighting is
164 given to the symbols resulting from the aliases :py:obj:`ALIAS_SYMBOLS`.
165
166 """
167
168 global SYMBOL_TO_SI # pylint: disable=global-statement
169 if SYMBOL_TO_SI:
170 return SYMBOL_TO_SI
171
172 # filter out units which can't be normalized to a SI unit and filter out
173 # units without a symbol / arcsecond does not have a symbol
174 # https://www.wikidata.org/wiki/Q829073
175
176 for item in data.WIKIDATA_UNITS.values():
177 if item['to_si_factor'] and item['symbol']:
178 SYMBOL_TO_SI.append(
179 (
180 item['symbol'],
181 item['si_name'],
182 1 / item['to_si_factor'], # from_si
183 item['to_si_factor'], # to_si
184 item['symbol'],
185 )
186 )
187
188 for item in ADDITIONAL_UNITS:
189 SYMBOL_TO_SI.append(
190 (
191 item['symbol'],
192 item['si_name'],
193 item['from_si'],
194 item['to_si'],
195 item['symbol'],
196 )
197 )
198
199 alias_items = []
200 for item in SYMBOL_TO_SI:
201 for alias in ALIAS_SYMBOLS.get(item[0], ()):
202 alias_items.append(
203 (
204 alias,
205 item[1],
206 item[2], # from_si
207 item[3], # to_si
208 item[0], # origin unit
209 )
210 )
211 SYMBOL_TO_SI = SYMBOL_TO_SI + alias_items
212 return SYMBOL_TO_SI
213
214
215def _parse_text_and_convert(from_query, to_query) -> str | None:
216
217 # pylint: disable=too-many-branches, too-many-locals
218
219 if not (from_query and to_query):
220 return None
221
222 measured = re.match(RE_MEASURE, from_query, re.VERBOSE)
223 if not (measured and measured.group('number'), measured.group('unit')):
224 return None
225
226 # Symbols are not unique, if there are several hits for the from-unit, then
227 # the correct one must be determined by comparing it with the to-unit
228 # https://github.com/searxng/searxng/pull/3378#issuecomment-2080974863
229
230 # first: collecting possible units
231
232 source_list, target_list = [], []
233
234 for symbol, si_name, from_si, to_si, orig_symbol in symbol_to_si():
235
236 if symbol == measured.group('unit'):
237 source_list.append((si_name, to_si))
238 if symbol == to_query:
239 target_list.append((si_name, from_si, orig_symbol))
240
241 if not (source_list and target_list):
242 return None
243
244 source_to_si = target_from_si = target_symbol = None
245
246 # second: find the right unit by comparing list of from-units with list of to-units
247
248 for source in source_list:
249 for target in target_list:
250 if source[0] == target[0]: # compare si_name
251 source_to_si = source[1]
252 target_from_si = target[1]
253 target_symbol = target[2]
254
255 if not (source_to_si and target_from_si):
256 return None
257
258 _locale = get_locale() or 'en_US'
259
260 value = measured.group('sign') + measured.group('number') + (measured.group('E') or '')
261 value = babel.numbers.parse_decimal(value, locale=_locale)
262
263 # convert value to SI unit
264
265 if isinstance(source_to_si, (float, int)):
266 value = float(value) * source_to_si
267 else:
268 value = source_to_si(float(value))
269
270 # convert value from SI unit to target unit
271
272 if isinstance(target_from_si, (float, int)):
273 value = float(value) * target_from_si
274 else:
275 value = target_from_si(float(value))
276
277 if measured.group('E'):
278 # when incoming notation is scientific, outgoing notation is scientific
279 result = babel.numbers.format_scientific(value, locale=_locale)
280 else:
281 result = babel.numbers.format_decimal(value, locale=_locale, format='#,##0.##########;-#')
282
283 return f'{result} {target_symbol}'
EngineResults post_search(self, "SXNG_Request" request, "SearchWithPlugins" search)
None __init__(self, "PluginCfg" plg_cfg)
str|None _parse_text_and_convert(from_query, to_query)