summaryrefslogtreecommitdiff
path: root/searx/search/processors/online_dictionary.py
diff options
context:
space:
mode:
authorMarkus Heiser <markus.heiser@darmarit.de>2025-09-11 19:10:27 +0200
committerMarkus Heiser <markus.heiser@darmarIT.de>2025-09-18 19:40:03 +0200
commit8f8343dc0d78bb57215afc3e99fd9000fce6e0cf (patch)
tree7c0aa8587ed4bc47e403b4148a308191e2d21c55 /searx/search/processors/online_dictionary.py
parent23257bddce864cfc44d64324dee36b32b1cf5248 (diff)
[mod] addition of various type hints / engine processors
Continuation of #5147 .. typification of the engine processors. BTW: - removed obsolete engine property https_support - fixed & improved currency_convert - engine instances can now implement a engine.setup method [#5147] https://github.com/searxng/searxng/pull/5147 Signed-off-by: Markus Heiser <markus.heiser@darmarit.de>
Diffstat (limited to 'searx/search/processors/online_dictionary.py')
-rw-r--r--searx/search/processors/online_dictionary.py120
1 files changed, 81 insertions, 39 deletions
diff --git a/searx/search/processors/online_dictionary.py b/searx/search/processors/online_dictionary.py
index 968c180d0..5827296c6 100644
--- a/searx/search/processors/online_dictionary.py
+++ b/searx/search/processors/online_dictionary.py
@@ -1,60 +1,102 @@
# SPDX-License-Identifier: AGPL-3.0-or-later
-"""Processors for engine-type: ``online_dictionary``
-
-"""
+"""Processor used for ``online_dictionary`` engines."""
+import typing as t
import re
-from searx.utils import is_valid_lang
-from .online import OnlineProcessor
+from searx.sxng_locales import sxng_locales
+from .online import OnlineProcessor, OnlineParams
+
+if t.TYPE_CHECKING:
+ from searx.search.models import SearchQuery
+
+search_syntax = re.compile(r".*?([a-z]+)-([a-z]+) (.+)$", re.I)
+"""Search syntax used for from/to language (e.g. ``en-de``)"""
+
+FromToType: t.TypeAlias = tuple[bool, str, str]
+"""Type of a language descriptions in the context of a ``online_dictionary``."""
+
+
+class DictParams(t.TypedDict):
+ """Dictionary request parameters."""
+
+ from_lang: FromToType
+ """Language from which is to be translated."""
+
+ to_lang: FromToType
+ """Language to translate into."""
-parser_re = re.compile('.*?([a-z]+)-([a-z]+) (.+)$', re.I)
+ query: str
+ """Search term, cleaned of search syntax (*from-to* has been removed)."""
+
+
+class OnlineDictParams(DictParams, OnlineParams): # pylint: disable=duplicate-bases
+ """Request parameters of a ``online_dictionary`` engine."""
class OnlineDictionaryProcessor(OnlineProcessor):
- """Processor class used by ``online_dictionary`` engines."""
+ """Processor class for ``online_dictionary`` engines."""
- engine_type = 'online_dictionary'
+ engine_type: str = "online_dictionary"
- def get_params(self, search_query, engine_category):
- """Returns a set of :ref:`request params <engine request online_dictionary>` or
- ``None`` if search query does not match to :py:obj:`parser_re`.
- """
- params = super().get_params(search_query, engine_category)
- if params is None:
- return None
+ def get_params(self, search_query: "SearchQuery", engine_category: str) -> OnlineDictParams | None:
+ """Returns a dictionary with the :ref:`request params <engine request
+ online_dictionary>` (:py:obj:`OnlineDictParams`). ``None`` is returned
+ if the search query does not match :py:obj:`search_syntax`."""
- m = parser_re.match(search_query.query)
+ online_params: OnlineParams | None = super().get_params(search_query, engine_category)
+ if online_params is None:
+ return None
+ m = search_syntax.match(search_query.query)
if not m:
return None
from_lang, to_lang, query = m.groups()
-
- from_lang = is_valid_lang(from_lang)
- to_lang = is_valid_lang(to_lang)
-
+ from_lang = _get_lang_descr(from_lang)
+ to_lang = _get_lang_descr(to_lang)
if not from_lang or not to_lang:
return None
- params['from_lang'] = from_lang
- params['to_lang'] = to_lang
- params['query'] = query
+ params: OnlineDictParams = {
+ **online_params,
+ "from_lang": from_lang,
+ "to_lang": to_lang,
+ "query": query,
+ }
return params
- def get_default_tests(self):
- tests = {}
-
- if getattr(self.engine, 'paging', False):
- tests['translation_paging'] = {
- 'matrix': {'query': 'en-es house', 'pageno': (1, 2, 3)},
- 'result_container': ['not_empty', ('one_title_contains', 'house')],
- 'test': ['unique_results'],
- }
- else:
- tests['translation'] = {
- 'matrix': {'query': 'en-es house'},
- 'result_container': ['not_empty', ('one_title_contains', 'house')],
- }
-
- return tests
+
+def _get_lang_descr(lang: str) -> FromToType | None:
+ """Returns language's code and language's english name if argument ``lang``
+ describes a language known by SearXNG, otherwise ``None``.
+
+ Examples:
+
+ .. code:: python
+
+ >>> _get_lang_descr("zz")
+ None
+ >>> _get_lang_descr("uk")
+ (True, "uk", "ukrainian")
+ >>> _get_lang_descr(b"uk")
+ (True, "uk", "ukrainian")
+ >>> _get_lang_descr("en")
+ (True, "en", "english")
+ >>> _get_lang_descr("EspaƱol")
+ (True, "es", "spanish")
+ >>> _get_lang_descr("Spanish")
+ (True, "es", "spanish")
+
+ """
+ lang = lang.lower()
+ is_abbr = len(lang) == 2
+ if is_abbr:
+ for l in sxng_locales:
+ if l[0][:2] == lang:
+ return (True, l[0][:2], l[3].lower())
+ return None
+ for l in sxng_locales:
+ if l[1].lower() == lang or l[3].lower() == lang:
+ return (True, l[0][:2], l[3].lower())
+ return None