.oO SearXNG Developer Documentation Oo.
Loading...
Searching...
No Matches
traits.py
Go to the documentation of this file.
1# SPDX-License-Identifier: AGPL-3.0-or-later
2"""Engine's traits are fetched from the origin engines and stored in a JSON file
3in the *data folder*. Most often traits are languages and region codes and
4their mapping from SearXNG's representation to the representation in the origin
5search engine. For new traits new properties can be added to the class
6:py:class:`EngineTraits`.
7
8To load traits from the persistence :py:obj:`EngineTraitsMap.from_data` can be
9used.
10"""
11
12from __future__ import annotations
13
14import os
15import json
16import dataclasses
17import types
18from typing import Dict, Literal, Iterable, Union, Callable, Optional, TYPE_CHECKING
19
20from searx import locales
21from searx.data import data_dir, ENGINE_TRAITS
22
23if TYPE_CHECKING:
24 from . import Engine
25
26
27class EngineTraitsEncoder(json.JSONEncoder):
28 """Encodes :class:`EngineTraits` to a serializable object, see
29 :class:`json.JSONEncoder`."""
30
31 def default(self, o):
32 """Return dictionary of a :class:`EngineTraits` object."""
33 if isinstance(o, EngineTraits):
34 return o.__dict__
35 return super().default(o)
36
37
38@dataclasses.dataclass
40 """The class is intended to be instantiated for each engine."""
41
42 regions: Dict[str, str] = dataclasses.field(default_factory=dict)
43 """Maps SearXNG's internal representation of a region to the one of the engine.
44
45 SearXNG's internal representation can be parsed by babel and the value is
46 send to the engine:
47
48 .. code:: python
49
50 regions ={
51 'fr-BE' : <engine's region name>,
52 }
53
54 for key, egnine_region regions.items():
55 searxng_region = babel.Locale.parse(key, sep='-')
56 ...
57 """
58
59 languages: Dict[str, str] = dataclasses.field(default_factory=dict)
60 """Maps SearXNG's internal representation of a language to the one of the engine.
61
62 SearXNG's internal representation can be parsed by babel and the value is
63 send to the engine:
64
65 .. code:: python
66
67 languages = {
68 'ca' : <engine's language name>,
69 }
70
71 for key, egnine_lang in languages.items():
72 searxng_lang = babel.Locale.parse(key)
73 ...
74 """
75
76 all_locale: Optional[str] = None
77 """To which locale value SearXNG's ``all`` language is mapped (shown a "Default
78 language").
79 """
80
81 data_type: Literal['traits_v1'] = 'traits_v1'
82 """Data type, default is 'traits_v1'.
83 """
84
85 custom: Dict[str, Union[Dict[str, Dict], Iterable[str]]] = dataclasses.field(default_factory=dict)
86 """A place to store engine's custom traits, not related to the SearXNG core.
87 """
88
89 def get_language(self, searxng_locale: str, default=None):
90 """Return engine's language string that *best fits* to SearXNG's locale.
91
92 :param searxng_locale: SearXNG's internal representation of locale
93 selected by the user.
94
95 :param default: engine's default language
96
97 The *best fits* rules are implemented in
98 :py:obj:`searx.locales.get_engine_locale`. Except for the special value ``all``
99 which is determined from :py:obj:`EngineTraits.all_locale`.
100 """
101 if searxng_locale == 'all' and self.all_locale is not None:
102 return self.all_locale
103 return locales.get_engine_locale(searxng_locale, self.languages, default=default)
104
105 def get_region(self, searxng_locale: str, default=None):
106 """Return engine's region string that best fits to SearXNG's locale.
107
108 :param searxng_locale: SearXNG's internal representation of locale
109 selected by the user.
110
111 :param default: engine's default region
112
113 The *best fits* rules are implemented in
114 :py:obj:`searx.locales.get_engine_locale`. Except for the special value ``all``
115 which is determined from :py:obj:`EngineTraits.all_locale`.
116 """
117 if searxng_locale == 'all' and self.all_locale is not None:
118 return self.all_locale
119 return locales.get_engine_locale(searxng_locale, self.regions, default=default)
120
121 def is_locale_supported(self, searxng_locale: str) -> bool:
122 """A *locale* (SearXNG's internal representation) is considered to be
123 supported by the engine if the *region* or the *language* is supported
124 by the engine.
125
126 For verification the functions :py:func:`EngineTraits.get_region` and
127 :py:func:`EngineTraits.get_language` are used.
128 """
129 if self.data_type == 'traits_v1':
130 return bool(self.get_region(searxng_locale) or self.get_language(searxng_locale))
131
132 raise TypeError('engine traits of type %s is unknown' % self.data_type)
133
134 def copy(self):
135 """Create a copy of the dataclass object."""
136 return EngineTraits(**dataclasses.asdict(self))
137
138 @classmethod
139 def fetch_traits(cls, engine: Engine) -> Union['EngineTraits', None]:
140 """Call a function ``fetch_traits(engine_traits)`` from engines namespace to fetch
141 and set properties from the origin engine in the object ``engine_traits``. If
142 function does not exists, ``None`` is returned.
143 """
144
145 fetch_traits = getattr(engine, 'fetch_traits', None)
146 engine_traits = None
147
148 if fetch_traits:
149 engine_traits = cls()
150 fetch_traits(engine_traits)
151 return engine_traits
152
153 def set_traits(self, engine: Engine):
154 """Set traits from self object in a :py:obj:`.Engine` namespace.
155
156 :param engine: engine instance build by :py:func:`searx.engines.load_engine`
157 """
158
159 if self.data_type == 'traits_v1':
160 self._set_traits_v1(engine)
161 else:
162 raise TypeError('engine traits of type %s is unknown' % self.data_type)
163
164 def _set_traits_v1(self, engine: Engine):
165 # For an engine, when there is `language: ...` in the YAML settings the engine
166 # does support only this one language (region)::
167 #
168 # - name: google italian
169 # engine: google
170 # language: it
171 # region: it-IT # type: ignore
172
173 traits = self.copy()
174
175 _msg = "settings.yml - engine: '%s' / %s: '%s' not supported"
176
177 languages = traits.languages
178 if hasattr(engine, 'language'):
179 if engine.language not in languages:
180 raise ValueError(_msg % (engine.name, 'language', engine.language))
181 traits.languages = {engine.language: languages[engine.language]}
182
183 regions = traits.regions
184 if hasattr(engine, 'region'):
185 if engine.region not in regions:
186 raise ValueError(_msg % (engine.name, 'region', engine.region))
187 traits.regions = {engine.region: regions[engine.region]}
188
189 engine.language_support = bool(traits.languages or traits.regions)
190
191 # set the copied & modified traits in engine's namespace
192 engine.traits = traits
193
194
195class EngineTraitsMap(Dict[str, EngineTraits]):
196 """A python dictionary to map :class:`EngineTraits` by engine name."""
197
198 ENGINE_TRAITS_FILE = (data_dir / 'engine_traits.json').resolve()
199 """File with persistence of the :py:obj:`EngineTraitsMap`."""
200
201 def save_data(self):
202 """Store EngineTraitsMap in in file :py:obj:`self.ENGINE_TRAITS_FILE`"""
203 with open(self.ENGINE_TRAITS_FILE, 'w', encoding='utf-8') as f:
204 json.dump(self, f, indent=2, sort_keys=True, cls=EngineTraitsEncoder)
205
206 @classmethod
207 def from_data(cls) -> 'EngineTraitsMap':
208 """Instantiate :class:`EngineTraitsMap` object from :py:obj:`ENGINE_TRAITS`"""
209 obj = cls()
210 for k, v in ENGINE_TRAITS.items():
211 obj[k] = EngineTraits(**v)
212 return obj
213
214 @classmethod
215 def fetch_traits(cls, log: Callable) -> 'EngineTraitsMap':
216 from searx import engines # pylint: disable=cyclic-import, import-outside-toplevel
217
218 names = list(engines.engines)
219 names.sort()
220 obj = cls()
221
222 for engine_name in names:
223 engine = engines.engines[engine_name]
224 traits = None
225
226 # pylint: disable=broad-exception-caught
227 try:
228 traits = EngineTraits.fetch_traits(engine)
229 except Exception as exc:
230 log("FATAL: while fetch_traits %s: %s" % (engine_name, exc))
231 if os.environ.get('FORCE', '').lower() not in ['on', 'true', '1']:
232 raise
233 v = ENGINE_TRAITS.get(engine_name)
234 if v:
235 log("FORCE: re-use old values from fetch_traits - ENGINE_TRAITS[%s]" % engine_name)
236 traits = EngineTraits(**v)
237
238 if traits is not None:
239 log("%-20s: SearXNG languages --> %s " % (engine_name, len(traits.languages)))
240 log("%-20s: SearXNG regions --> %s" % (engine_name, len(traits.regions)))
241 obj[engine_name] = traits
242
243 return obj
244
245 def set_traits(self, engine: Engine | types.ModuleType):
246 """Set traits in a :py:obj:`Engine` namespace.
247
248 :param engine: engine instance build by :py:func:`searx.engines.load_engine`
249 """
250
251 engine_traits = EngineTraits(data_type='traits_v1')
252 if engine.name in self.keys():
253 engine_traits = self[engine.name]
254
255 elif engine.engine in self.keys():
256 # The key of the dictionary traits_map is the *engine name*
257 # configured in settings.xml. When multiple engines are configured
258 # in settings.yml to use the same origin engine (python module)
259 # these additional engines can use the languages from the origin
260 # engine. For this use the configured ``engine: ...`` from
261 # settings.yml
262 engine_traits = self[engine.engine]
263
264 engine_traits.set_traits(engine)
'EngineTraitsMap' fetch_traits(cls, Callable log)
Definition traits.py:215
'EngineTraitsMap' from_data(cls)
Definition traits.py:207
set_traits(self, Engine|types.ModuleType engine)
Definition traits.py:245
_set_traits_v1(self, Engine engine)
Definition traits.py:164
get_region(self, str searxng_locale, default=None)
Definition traits.py:105
bool is_locale_supported(self, str searxng_locale)
Definition traits.py:121
get_language(self, str searxng_locale, default=None)
Definition traits.py:89
Union[ 'EngineTraits', None] fetch_traits(cls, Engine engine)
Definition traits.py:139
set_traits(self, Engine engine)
Definition traits.py:153