unit_converter.py 8.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260
  1. # SPDX-License-Identifier: AGPL-3.0-or-later
  2. """A plugin for converting measured values from one unit to another unit (a
  3. unit converter).

The plugin looks up the symbols (given in the query term) in a list of
converters, each converter is one item in the list (compare
:py:obj:`ADDITIONAL_UNITS`).  If the symbols are ambiguous, the matching units
of measurement are evaluated.  The weighting in the evaluation results from the
sorting of the :py:obj:`list of unit converters<symbol_to_si>`.

Enable in ``settings.yml``:

.. code:: yaml

  enabled_plugins:
    ..
    - 'Unit converter plugin'

  14. """
  15. import re
  16. import babel.numbers
  17. from flask_babel import gettext, get_locale
  18. from searx import data
# Plugin metadata.  ``name`` is the string used to enable the plugin in
# ``settings.yml`` (see the module docstring); ``description`` is passed
# through gettext so it can be translated.
# NOTE(review): ``default_on`` is presumably read by the plugin loader to
# decide whether the plugin is active without explicit configuration -- confirm.
name = "Unit converter plugin"
description = gettext("Convert between units")
default_on = True

# Words that separate the measured value from the target unit in a query,
# e.g. "10 km to mi".  post_search() looks for these as whole query tokens.
CONVERT_KEYWORDS = ["in", "to", "as"]
# inspired from https://stackoverflow.com/a/42475086
#
# Pattern for a measured value of the form "<sign><number><exponent> <unit>".
# The pattern contains whitespace and inline comments, so it has to be used
# with the ``re.VERBOSE`` flag.  Note that the ``number`` group may match the
# empty string (``*`` quantifier); callers have to check it before parsing.
RE_MEASURE = r'''
(?P<sign>[-+]?) # +/- or nothing for positive
(\s*) # separator: white space or nothing
(?P<number>[\d\.,]*) # number: 1,000.00 (en) or 1.000,00 (de)
(?P<E>[eE][-+]?\d+)? # scientific notation: e(+/-)2 (*10^2)
(\s*) # separator: white space or nothing
(?P<unit>\S+) # unit of measure
'''
  32. ADDITIONAL_UNITS = [
  33. {
  34. "si_name": "Q11579",
  35. "symbol": "°C",
  36. "to_si": lambda val: val + 273.15,
  37. "from_si": lambda val: val - 273.15,
  38. },
  39. {
  40. "si_name": "Q11579",
  41. "symbol": "°F",
  42. "to_si": lambda val: (val + 459.67) * 5 / 9,
  43. "from_si": lambda val: (val * 9 / 5) - 459.67,
  44. },
  45. ]
  46. """Additional items to convert from a measure unit to a SI unit (vice versa).
  47. .. code:: python
  48. {
  49. "si_name": "Q11579", # Wikidata item ID of the SI unit (Kelvin)
  50. "symbol": "°C", # symbol of the measure unit
  51. "to_si": lambda val: val + 273.15, # convert measure value (val) to SI unit
  52. "from_si": lambda val: val - 273.15, # convert SI value (val) measure unit
  53. },
  54. {
  55. "si_name": "Q11573",
  56. "symbol": "mi",
  57. "to_si": 1609.344, # convert measure value (val) to SI unit
  58. "from_si": 1 / 1609.344 # convert SI value (val) measure unit
  59. },
  60. The values of ``to_si`` and ``from_si`` can be of :py:obj:`float` (a multiplier)
  61. or a callable_ (val in / converted value returned).
  62. .. _callable: https://docs.python.org/3/glossary.html#term-callable
  63. """
  64. ALIAS_SYMBOLS = {
  65. '°C': ('C',),
  66. '°F': ('F',),
  67. 'mi': ('L',),
  68. }
  69. """Alias symbols for known unit of measure symbols / by example::
  70. '°C': ('C', ...), # list of alias symbols for °C (Q69362731)
  71. '°F': ('F', ...), # list of alias symbols for °F (Q99490479)
  72. 'mi': ('L',), # list of alias symbols for mi (Q253276)
  73. """
  74. SYMBOL_TO_SI = []
  75. def symbol_to_si():
  76. """Generates a list of tuples, each tuple is a measure unit and the fields
  77. in the tuple are:
  78. 0. Symbol of the measure unit (e.g. 'mi' for measure unit 'miles' Q253276)
  79. 1. SI name of the measure unit (e.g. Q11573 for SI unit 'metre')
  80. 2. Factor to get SI value from measure unit (e.g. 1mi is equal to SI 1m
  81. multiplied by 1609.344)
  82. 3. Factor to get measure value from from SI value (e.g. SI 100m is equal to
  83. 100mi divided by 1609.344)
  84. The returned list is sorted, the first items are created from
  85. ``WIKIDATA_UNITS``, the second group of items is build from
  86. :py:obj:`ADDITIONAL_UNITS` and items created from :py:obj:`ALIAS_SYMBOLS`.
  87. If you search this list for a symbol, then a match with a symbol from
  88. Wikidata has the highest weighting (first hit in the list), followed by the
  89. symbols from the :py:obj:`ADDITIONAL_UNITS` and the lowest weighting is
  90. given to the symbols resulting from the aliases :py:obj:`ALIAS_SYMBOLS`.
  91. """
  92. global SYMBOL_TO_SI # pylint: disable=global-statement
  93. if SYMBOL_TO_SI:
  94. return SYMBOL_TO_SI
  95. # filter out units which can't be normalized to a SI unit and filter out
  96. # units without a symbol / arcsecond does not have a symbol
  97. # https://www.wikidata.org/wiki/Q829073
  98. for item in data.WIKIDATA_UNITS.values():
  99. if item['to_si_factor'] and item['symbol']:
  100. SYMBOL_TO_SI.append(
  101. (
  102. item['symbol'],
  103. item['si_name'],
  104. item['to_si_factor'], # from_si
  105. 1 / item['to_si_factor'], # to_si
  106. item['symbol'],
  107. )
  108. )
  109. for item in ADDITIONAL_UNITS:
  110. SYMBOL_TO_SI.append(
  111. (
  112. item['symbol'],
  113. item['si_name'],
  114. item['from_si'],
  115. item['to_si'],
  116. item['symbol'],
  117. )
  118. )
  119. alias_items = []
  120. for item in SYMBOL_TO_SI:
  121. for alias in ALIAS_SYMBOLS.get(item[0], ()):
  122. alias_items.append(
  123. (
  124. alias,
  125. item[1],
  126. item[2], # from_si
  127. item[3], # to_si
  128. item[0], # origin unit
  129. )
  130. )
  131. SYMBOL_TO_SI = SYMBOL_TO_SI + alias_items
  132. return SYMBOL_TO_SI
  133. def _parse_text_and_convert(search, from_query, to_query):
  134. # pylint: disable=too-many-branches, too-many-locals
  135. if not (from_query and to_query):
  136. return
  137. measured = re.match(RE_MEASURE, from_query, re.VERBOSE)
  138. if not (measured and measured.group('number'), measured.group('unit')):
  139. return
  140. # Symbols are not unique, if there are several hits for the from-unit, then
  141. # the correct one must be determined by comparing it with the to-unit
  142. # https://github.com/searxng/searxng/pull/3378#issuecomment-2080974863
  143. # first: collecting possible units
  144. source_list, target_list = [], []
  145. for symbol, si_name, from_si, to_si, orig_symbol in symbol_to_si():
  146. if symbol == measured.group('unit'):
  147. source_list.append((si_name, to_si))
  148. if symbol == to_query:
  149. target_list.append((si_name, from_si, orig_symbol))
  150. if not (source_list and target_list):
  151. return
  152. source_to_si = target_from_si = target_symbol = None
  153. # second: find the right unit by comparing list of from-units with list of to-units
  154. for source in source_list:
  155. for target in target_list:
  156. if source[0] == target[0]: # compare si_name
  157. source_to_si = source[1]
  158. target_from_si = target[1]
  159. target_symbol = target[2]
  160. if not (source_to_si and target_from_si):
  161. return
  162. _locale = get_locale() or 'en_US'
  163. value = measured.group('sign') + measured.group('number') + (measured.group('E') or '')
  164. value = babel.numbers.parse_decimal(value, locale=_locale)
  165. # convert value to SI unit
  166. if isinstance(source_to_si, (float, int)):
  167. value = float(value) * source_to_si
  168. else:
  169. value = source_to_si(float(value))
  170. # convert value from SI unit to target unit
  171. if isinstance(target_from_si, (float, int)):
  172. value = float(value) * target_from_si
  173. else:
  174. value = target_from_si(float(value))
  175. if measured.group('E'):
  176. # when incomming notation is scientific, outgoing notation is scientific
  177. result = babel.numbers.format_scientific(value, locale=_locale)
  178. else:
  179. result = babel.numbers.format_decimal(value, locale=_locale, format='#,##0.##########;-#')
  180. search.result_container.answers['conversion'] = {'answer': f'{result} {target_symbol}'}
  181. def post_search(_request, search):
  182. # only convert between units on the first page
  183. if search.search_query.pageno > 1:
  184. return True
  185. query = search.search_query.query
  186. query_parts = query.split(" ")
  187. if len(query_parts) < 3:
  188. return True
  189. for query_part in query_parts:
  190. for keyword in CONVERT_KEYWORDS:
  191. if query_part == keyword:
  192. from_query, to_query = query.split(keyword, 1)
  193. _parse_text_and_convert(search, from_query.strip(), to_query.strip())
  194. return True
  195. return True