unit_converter.py 8.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264
# SPDX-License-Identifier: AGPL-3.0-or-later
"""A plugin for converting measured values from one unit to another unit (a
unit converter).

The plugin looks up the symbols (given in the query term) in a list of
converters; each converter is one item in the list (compare
:py:obj:`ADDITIONAL_UNITS`).  If the symbols are ambiguous, the matching units
of measurement are evaluated.  The weighting in the evaluation results from the
sorting of the :py:obj:`list of unit converters<symbol_to_si>`.

Enable in ``settings.yml``:

.. code:: yaml

  enabled_plugins:
    ..
    - 'Unit converter plugin'

"""
  15. import re
  16. import babel.numbers
  17. from flask_babel import gettext, get_locale
  18. from searx import data
# Plugin metadata.
# NOTE(review): presumably these names are read by the host application's
# plugin loader -- confirm against the loader before renaming any of them.
name = "Unit converter plugin"
description = gettext("Convert between units")
default_on = True
plugin_id = "unit_converter"
preference_section = "general"

# Words that separate the measured value from the target unit in a query, e.g.
# "10 km in mi".  post_search() compares each space separated part of the query
# with these keywords.
CONVERT_KEYWORDS = ["in", "to", "as"]
# inspired from https://stackoverflow.com/a/42475086
#
# Pattern of a measured value: optional sign, number, optional exponent and the
# unit symbol.  The pattern contains inline comments and therefore has to be
# used with ``re.VERBOSE`` (see _parse_text_and_convert).  The ``number`` group
# may match an empty string, so callers have to check it.
RE_MEASURE = r'''
(?P<sign>[-+]?) # +/- or nothing for positive
(\s*) # separator: white space or nothing
(?P<number>[\d\.,]*) # number: 1,000.00 (en) or 1.000,00 (de)
(?P<E>[eE][-+]?\d+)? # scientific notation: e(+/-)2 (*10^2)
(\s*) # separator: white space or nothing
(?P<unit>\S+) # unit of measure
'''
  34. ADDITIONAL_UNITS = [
  35. {
  36. "si_name": "Q11579",
  37. "symbol": "°C",
  38. "to_si": lambda val: val + 273.15,
  39. "from_si": lambda val: val - 273.15,
  40. },
  41. {
  42. "si_name": "Q11579",
  43. "symbol": "°F",
  44. "to_si": lambda val: (val + 459.67) * 5 / 9,
  45. "from_si": lambda val: (val * 9 / 5) - 459.67,
  46. },
  47. ]
  48. """Additional items to convert from a measure unit to a SI unit (vice versa).
  49. .. code:: python
  50. {
  51. "si_name": "Q11579", # Wikidata item ID of the SI unit (Kelvin)
  52. "symbol": "°C", # symbol of the measure unit
  53. "to_si": lambda val: val + 273.15, # convert measure value (val) to SI unit
  54. "from_si": lambda val: val - 273.15, # convert SI value (val) measure unit
  55. },
  56. {
  57. "si_name": "Q11573",
  58. "symbol": "mi",
  59. "to_si": 1609.344, # convert measure value (val) to SI unit
  60. "from_si": 1 / 1609.344 # convert SI value (val) measure unit
  61. },
  62. The values of ``to_si`` and ``from_si`` can be of :py:obj:`float` (a multiplier)
  63. or a callable_ (val in / converted value returned).
  64. .. _callable: https://docs.python.org/3/glossary.html#term-callable
  65. """
  66. ALIAS_SYMBOLS = {
  67. '°C': ('C',),
  68. '°F': ('F',),
  69. 'mi': ('L',),
  70. }
  71. """Alias symbols for known unit of measure symbols / by example::
  72. '°C': ('C', ...), # list of alias symbols for °C (Q69362731)
  73. '°F': ('F', ...), # list of alias symbols for °F (Q99490479)
  74. 'mi': ('L',), # list of alias symbols for mi (Q253276)
  75. """
  76. SYMBOL_TO_SI = []
  77. def symbol_to_si():
  78. """Generates a list of tuples, each tuple is a measure unit and the fields
  79. in the tuple are:
  80. 0. Symbol of the measure unit (e.g. 'mi' for measure unit 'miles' Q253276)
  81. 1. SI name of the measure unit (e.g. Q11573 for SI unit 'metre')
  82. 2. Factor to get SI value from measure unit (e.g. 1mi is equal to SI 1m
  83. multiplied by 1609.344)
  84. 3. Factor to get measure value from from SI value (e.g. SI 100m is equal to
  85. 100mi divided by 1609.344)
  86. The returned list is sorted, the first items are created from
  87. ``WIKIDATA_UNITS``, the second group of items is build from
  88. :py:obj:`ADDITIONAL_UNITS` and items created from :py:obj:`ALIAS_SYMBOLS`.
  89. If you search this list for a symbol, then a match with a symbol from
  90. Wikidata has the highest weighting (first hit in the list), followed by the
  91. symbols from the :py:obj:`ADDITIONAL_UNITS` and the lowest weighting is
  92. given to the symbols resulting from the aliases :py:obj:`ALIAS_SYMBOLS`.
  93. """
  94. global SYMBOL_TO_SI # pylint: disable=global-statement
  95. if SYMBOL_TO_SI:
  96. return SYMBOL_TO_SI
  97. # filter out units which can't be normalized to a SI unit and filter out
  98. # units without a symbol / arcsecond does not have a symbol
  99. # https://www.wikidata.org/wiki/Q829073
  100. for item in data.WIKIDATA_UNITS.values():
  101. if item['to_si_factor'] and item['symbol']:
  102. SYMBOL_TO_SI.append(
  103. (
  104. item['symbol'],
  105. item['si_name'],
  106. 1 / item['to_si_factor'], # from_si
  107. item['to_si_factor'], # to_si
  108. item['symbol'],
  109. )
  110. )
  111. for item in ADDITIONAL_UNITS:
  112. SYMBOL_TO_SI.append(
  113. (
  114. item['symbol'],
  115. item['si_name'],
  116. item['from_si'],
  117. item['to_si'],
  118. item['symbol'],
  119. )
  120. )
  121. alias_items = []
  122. for item in SYMBOL_TO_SI:
  123. for alias in ALIAS_SYMBOLS.get(item[0], ()):
  124. alias_items.append(
  125. (
  126. alias,
  127. item[1],
  128. item[2], # from_si
  129. item[3], # to_si
  130. item[0], # origin unit
  131. )
  132. )
  133. SYMBOL_TO_SI = SYMBOL_TO_SI + alias_items
  134. return SYMBOL_TO_SI
  135. def _parse_text_and_convert(search, from_query, to_query):
  136. # pylint: disable=too-many-branches, too-many-locals
  137. if not (from_query and to_query):
  138. return
  139. measured = re.match(RE_MEASURE, from_query, re.VERBOSE)
  140. if not (measured and measured.group('number'), measured.group('unit')):
  141. return
  142. # Symbols are not unique, if there are several hits for the from-unit, then
  143. # the correct one must be determined by comparing it with the to-unit
  144. # https://github.com/searxng/searxng/pull/3378#issuecomment-2080974863
  145. # first: collecting possible units
  146. source_list, target_list = [], []
  147. for symbol, si_name, from_si, to_si, orig_symbol in symbol_to_si():
  148. if symbol == measured.group('unit'):
  149. source_list.append((si_name, to_si))
  150. if symbol == to_query:
  151. target_list.append((si_name, from_si, orig_symbol))
  152. if not (source_list and target_list):
  153. return
  154. source_to_si = target_from_si = target_symbol = None
  155. # second: find the right unit by comparing list of from-units with list of to-units
  156. for source in source_list:
  157. for target in target_list:
  158. if source[0] == target[0]: # compare si_name
  159. source_to_si = source[1]
  160. target_from_si = target[1]
  161. target_symbol = target[2]
  162. if not (source_to_si and target_from_si):
  163. return
  164. _locale = get_locale() or 'en_US'
  165. value = measured.group('sign') + measured.group('number') + (measured.group('E') or '')
  166. value = babel.numbers.parse_decimal(value, locale=_locale)
  167. # convert value to SI unit
  168. if isinstance(source_to_si, (float, int)):
  169. value = float(value) * source_to_si
  170. else:
  171. value = source_to_si(float(value))
  172. # convert value from SI unit to target unit
  173. if isinstance(target_from_si, (float, int)):
  174. value = float(value) * target_from_si
  175. else:
  176. value = target_from_si(float(value))
  177. if measured.group('E'):
  178. # when incoming notation is scientific, outgoing notation is scientific
  179. result = babel.numbers.format_scientific(value, locale=_locale)
  180. else:
  181. result = babel.numbers.format_decimal(value, locale=_locale, format='#,##0.##########;-#')
  182. search.result_container.answers['conversion'] = {'answer': f'{result} {target_symbol}'}
  183. def post_search(_request, search):
  184. # only convert between units on the first page
  185. if search.search_query.pageno > 1:
  186. return True
  187. query = search.search_query.query
  188. query_parts = query.split(" ")
  189. if len(query_parts) < 3:
  190. return True
  191. for query_part in query_parts:
  192. for keyword in CONVERT_KEYWORDS:
  193. if query_part == keyword:
  194. from_query, to_query = query.split(keyword, 1)
  195. _parse_text_and_convert(search, from_query.strip(), to_query.strip())
  196. return True
  197. return True