123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251 |
- # SPDX-License-Identifier: AGPL-3.0-or-later
- """Engine's traits are fetched from the origin engines and stored in a JSON file
- in the *data folder*. Most often traits are languages and region codes and
- their mapping from SearXNG's representation to the representation in the origin
- search engine. For new traits new properties can be added to the class
- :py:class:`EngineTraits`.
- To load traits from the persistence :py:obj:`EngineTraitsMap.from_data` can be
- used.
- """
- from __future__ import annotations
- import json
- import dataclasses
- import types
- from typing import Dict, Literal, Iterable, Union, Callable, Optional, TYPE_CHECKING
- from searx import locales
- from searx.data import data_dir, ENGINE_TRAITS
- if TYPE_CHECKING:
- from . import Engine
class EngineTraitsEncoder(json.JSONEncoder):
    """JSON encoder that is able to serialize :class:`EngineTraits` objects, see
    :class:`json.JSONEncoder`."""

    def default(self, o):
        """Return the attribute dictionary of a :class:`EngineTraits` object.

        Objects of any other type are delegated to the default implementation
        of the base class.
        """
        if not isinstance(o, EngineTraits):
            return super().default(o)
        return vars(o)
@dataclasses.dataclass
class EngineTraits:
    """The class is intended to be instantiated for each engine."""

    regions: Dict[str, str] = dataclasses.field(default_factory=dict)
    """Maps SearXNG's internal representation of a region to the one of the engine.

    SearXNG's internal representation can be parsed by babel and the value is
    sent to the engine:

    .. code:: python

       regions = {
           'fr-BE' : <engine's region name>,
       }

       for key, engine_region in regions.items():
          searxng_region = babel.Locale.parse(key, sep='-')
          ...
    """

    languages: Dict[str, str] = dataclasses.field(default_factory=dict)
    """Maps SearXNG's internal representation of a language to the one of the engine.

    SearXNG's internal representation can be parsed by babel and the value is
    sent to the engine:

    .. code:: python

       languages = {
           'ca' : <engine's language name>,
       }

       for key, engine_lang in languages.items():
          searxng_lang = babel.Locale.parse(key)
          ...
    """

    all_locale: Optional[str] = None
    """To which locale value SearXNG's ``all`` language is mapped (shown as
    "Default language").
    """

    data_type: Literal['traits_v1'] = 'traits_v1'
    """Data type, default is 'traits_v1'.
    """

    custom: Dict[str, Union[Dict[str, Dict], Iterable[str]]] = dataclasses.field(default_factory=dict)
    """A place to store engine's custom traits, not related to the SearXNG core.
    """

    def get_language(self, searxng_locale: str, default=None):
        """Return engine's language string that *best fits* to SearXNG's locale.

        :param searxng_locale: SearXNG's internal representation of locale
          selected by the user.

        :param default: engine's default language

        The *best fits* rules are implemented in
        :py:obj:`searx.locales.get_engine_locale`.  Except for the special value
        ``all`` which is determined from :py:obj:`EngineTraits.all_locale` (when
        that one is set).
        """
        if searxng_locale == 'all' and self.all_locale is not None:
            return self.all_locale
        return locales.get_engine_locale(searxng_locale, self.languages, default=default)

    def get_region(self, searxng_locale: str, default=None):
        """Return engine's region string that *best fits* to SearXNG's locale.

        :param searxng_locale: SearXNG's internal representation of locale
          selected by the user.

        :param default: engine's default region

        The *best fits* rules are implemented in
        :py:obj:`searx.locales.get_engine_locale`.  Except for the special value
        ``all`` which is determined from :py:obj:`EngineTraits.all_locale` (when
        that one is set).
        """
        if searxng_locale == 'all' and self.all_locale is not None:
            return self.all_locale
        return locales.get_engine_locale(searxng_locale, self.regions, default=default)

    def is_locale_supported(self, searxng_locale: str) -> bool:
        """A *locale* (SearXNG's internal representation) is considered to be
        supported by the engine if the *region* or the *language* is supported
        by the engine.

        For verification the functions :py:func:`EngineTraits.get_region` and
        :py:func:`EngineTraits.get_language` are used.

        :raises TypeError: if :py:obj:`EngineTraits.data_type` is not
          ``traits_v1``.
        """
        if self.data_type != 'traits_v1':
            raise TypeError('engine traits of type %s is unknown' % self.data_type)
        return bool(self.get_region(searxng_locale) or self.get_language(searxng_locale))

    def copy(self):
        """Create a copy of the dataclass object.

        The copy is built from :py:func:`dataclasses.asdict`, so the nested
        dictionaries are copied too and can be modified without touching the
        original.  The copy has the same class as ``self``, i.e. a subclass of
        :class:`EngineTraits` is not downgraded to the base class.
        """
        return type(self)(**dataclasses.asdict(self))

    @classmethod
    def fetch_traits(cls, engine: Engine) -> Union['EngineTraits', None]:
        """Call a function ``fetch_traits(engine_traits)`` from engines namespace to
        fetch and set properties from the origin engine in the object
        ``engine_traits``.  If the function does not exist, ``None`` is returned.
        """
        fetch_traits = getattr(engine, 'fetch_traits', None)
        if not fetch_traits:
            return None

        engine_traits = cls()
        fetch_traits(engine_traits)
        return engine_traits

    def set_traits(self, engine: Engine):
        """Set traits from self object in a :py:obj:`.Engine` namespace.

        :param engine: engine instance build by :py:func:`searx.engines.load_engine`

        :raises TypeError: if :py:obj:`EngineTraits.data_type` is not
          ``traits_v1``.
        :raises ValueError: if the engine is configured with a ``language`` or
          ``region`` that is not part of these traits.
        """
        if self.data_type != 'traits_v1':
            raise TypeError('engine traits of type %s is unknown' % self.data_type)
        self._set_traits_v1(engine)

    def _set_traits_v1(self, engine: Engine):
        """Set a copy of the traits (``traits_v1``) in the namespace of ``engine``.

        The attributes ``engine.traits`` and ``engine.language_support`` are
        set.  The object ``self`` is not modified, only its copy is narrowed
        down to the language / region configured for the engine.
        """
        # For an engine, when there is `language: ...` in the YAML settings the engine
        # does support only this one language (region)::
        #
        #   - name: google italian
        #     engine: google
        #     language: it
        #     region: it-IT                                      # type: ignore

        traits = self.copy()

        _msg = "settings.yml - engine: '%s' / %s: '%s' not supported"

        languages = traits.languages
        if hasattr(engine, 'language'):
            if engine.language not in languages:
                raise ValueError(_msg % (engine.name, 'language', engine.language))
            traits.languages = {engine.language: languages[engine.language]}

        regions = traits.regions
        if hasattr(engine, 'region'):
            if engine.region not in regions:
                raise ValueError(_msg % (engine.name, 'region', engine.region))
            traits.regions = {engine.region: regions[engine.region]}

        engine.language_support = bool(traits.languages or traits.regions)

        # set the copied & modified traits in engine's namespace
        engine.traits = traits
class EngineTraitsMap(Dict[str, EngineTraits]):
    """A python dictionary to map :class:`EngineTraits` by engine name."""

    ENGINE_TRAITS_FILE = (data_dir / 'engine_traits.json').resolve()
    """File with persistence of the :py:obj:`EngineTraitsMap`."""

    def save_data(self):
        """Store the EngineTraitsMap in the file :py:obj:`self.ENGINE_TRAITS_FILE`
        (JSON, keys sorted, indented by two spaces)."""
        with open(self.ENGINE_TRAITS_FILE, 'w', encoding='utf-8') as traits_file:
            json.dump(self, traits_file, indent=2, sort_keys=True, cls=EngineTraitsEncoder)

    @classmethod
    def from_data(cls) -> 'EngineTraitsMap':
        """Instantiate :class:`EngineTraitsMap` object from :py:obj:`ENGINE_TRAITS`"""
        traits_map = cls()
        traits_map.update((name, EngineTraits(**properties)) for name, properties in ENGINE_TRAITS.items())
        return traits_map

    @classmethod
    def fetch_traits(cls, log: Callable) -> 'EngineTraitsMap':
        """Instantiate :class:`EngineTraitsMap` object with the traits fetched by
        :py:obj:`EngineTraits.fetch_traits` for the engines in
        ``searx.engines.engines`` (visited sorted by name).

        :param log: callable that is called with one message (string) to report
          the number of languages and regions of each engine that has traits.

        Engines for which :py:obj:`EngineTraits.fetch_traits` returns ``None``
        are not added to the map.
        """
        from searx import engines  # pylint: disable=cyclic-import, import-outside-toplevel

        traits_map = cls()
        for engine_name in sorted(engines.engines):
            traits = EngineTraits.fetch_traits(engines.engines[engine_name])
            if traits is None:
                continue
            log("%-20s: SearXNG languages --> %s " % (engine_name, len(traits.languages)))
            log("%-20s: SearXNG regions --> %s" % (engine_name, len(traits.regions)))
            traits_map[engine_name] = traits
        return traits_map

    def set_traits(self, engine: Engine | types.ModuleType):
        """Set traits in a :py:obj:`Engine` namespace.

        :param engine: engine instance build by :py:func:`searx.engines.load_engine`
        """
        if engine.name in self:
            engine_traits = self[engine.name]
        elif engine.engine in self:
            # The key of the dictionary traits_map is the *engine name*
            # configured in settings.yml.  When multiple engines are configured
            # in settings.yml to use the same origin engine (python module)
            # these additional engines can use the languages from the origin
            # engine.  For this use the configured ``engine: ...`` from
            # settings.yml
            engine_traits = self[engine.engine]
        else:
            # neither the engine name nor its origin engine is known in the
            # map: fall back to empty traits
            engine_traits = EngineTraits(data_type='traits_v1')

        engine_traits.set_traits(engine)
|