From a800dd04735c98a293edff00493a5fee3dfeaed7 Mon Sep 17 00:00:00 2001 From: Markus Heiser Date: Sun, 4 May 2025 20:37:06 +0200 Subject: [mod] implement searx.wikidata_units for unit converters --- searx/plugins/unit_converter.py | 128 +--------------------------------------- 1 file changed, 1 insertion(+), 127 deletions(-) (limited to 'searx/plugins') diff --git a/searx/plugins/unit_converter.py b/searx/plugins/unit_converter.py index 2bab598f2..0072afe55 100644 --- a/searx/plugins/unit_converter.py +++ b/searx/plugins/unit_converter.py @@ -15,7 +15,7 @@ import babel.numbers from flask_babel import gettext, get_locale -from searx import data +from searx.units import symbol_to_si from searx.plugins import Plugin, PluginInfo from searx.result_types import EngineResults @@ -86,132 +86,6 @@ RE_MEASURE = r''' ''' -ADDITIONAL_UNITS = [ - { - "si_name": "Q11579", - "symbol": "°C", - "to_si": lambda val: val + 273.15, - "from_si": lambda val: val - 273.15, - }, - { - "si_name": "Q11579", - "symbol": "°F", - "to_si": lambda val: (val + 459.67) * 5 / 9, - "from_si": lambda val: (val * 9 / 5) - 459.67, - }, -] -"""Additional items to convert from a measure unit to a SI unit (vice versa). - -.. code:: python - - { - "si_name": "Q11579", # Wikidata item ID of the SI unit (Kelvin) - "symbol": "°C", # symbol of the measure unit - "to_si": lambda val: val + 273.15, # convert measure value (val) to SI unit - "from_si": lambda val: val - 273.15, # convert SI value (val) measure unit - }, - { - "si_name": "Q11573", - "symbol": "mi", - "to_si": 1609.344, # convert measure value (val) to SI unit - "from_si": 1 / 1609.344 # convert SI value (val) measure unit - }, - -The values of ``to_si`` and ``from_si`` can be of :py:obj:`float` (a multiplier) -or a callable_ (val in / converted value returned). - -.. _callable: https://docs.python.org/3/glossary.html#term-callable -""" - - -ALIAS_SYMBOLS = { - '°C': ('C',), - '°F': ('F',), - 'mi': ('L',), -} -"""Alias symbols for known unit of measure symbols / by example:: - - '°C': ('C', ...), # list of alias symbols for °C (Q69362731) - '°F': ('F', ...), # list of alias symbols for °F (Q99490479) - 'mi': ('L',), # list of alias symbols for mi (Q253276) -""" - - -SYMBOL_TO_SI = [] - - -def symbol_to_si(): - """Generates a list of tuples, each tuple is a measure unit and the fields - in the tuple are: - - 0. Symbol of the measure unit (e.g. 'mi' for measure unit 'miles' Q253276) - - 1. SI name of the measure unit (e.g. Q11573 for SI unit 'metre') - - 2. Factor to get SI value from measure unit (e.g. 1mi is equal to SI 1m - multiplied by 1609.344) - - 3. Factor to get measure value from from SI value (e.g. SI 100m is equal to - 100mi divided by 1609.344) - - The returned list is sorted, the first items are created from - ``WIKIDATA_UNITS``, the second group of items is build from - :py:obj:`ADDITIONAL_UNITS` and items created from :py:obj:`ALIAS_SYMBOLS`. - - If you search this list for a symbol, then a match with a symbol from - Wikidata has the highest weighting (first hit in the list), followed by the - symbols from the :py:obj:`ADDITIONAL_UNITS` and the lowest weighting is - given to the symbols resulting from the aliases :py:obj:`ALIAS_SYMBOLS`. - - """ - - global SYMBOL_TO_SI # pylint: disable=global-statement - if SYMBOL_TO_SI: - return SYMBOL_TO_SI - - # filter out units which can't be normalized to a SI unit and filter out - # units without a symbol / arcsecond does not have a symbol - # https://www.wikidata.org/wiki/Q829073 - - for item in data.WIKIDATA_UNITS.values(): - if item['to_si_factor'] and item['symbol']: - SYMBOL_TO_SI.append( - ( - item['symbol'], - item['si_name'], - 1 / item['to_si_factor'], # from_si - item['to_si_factor'], # to_si - item['symbol'], - ) - ) - - for item in ADDITIONAL_UNITS: - SYMBOL_TO_SI.append( - ( - item['symbol'], - item['si_name'], - item['from_si'], - item['to_si'], - item['symbol'], - ) - ) - - alias_items = [] - for item in SYMBOL_TO_SI: - for alias in ALIAS_SYMBOLS.get(item[0], ()): - alias_items.append( - ( - alias, - item[1], - item[2], # from_si - item[3], # to_si - item[0], # origin unit - ) - ) - SYMBOL_TO_SI = SYMBOL_TO_SI + alias_items - return SYMBOL_TO_SI - - def _parse_text_and_convert(from_query, to_query) -> str | None: # pylint: disable=too-many-branches, too-many-locals -- cgit v1.2.3