wolframalpha_noapi.py 3.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133
  1. # SPDX-License-Identifier: AGPL-3.0-or-later
  2. """
  3. Wolfram|Alpha (Science)
  4. """
  5. from __future__ import annotations
  6. from json import loads
  7. from urllib.parse import urlencode
  8. from searx.network import get as http_get
  9. from searx.enginelib import EngineCache
  10. # about
  11. about = {
  12. "website": 'https://www.wolframalpha.com/',
  13. "wikidata_id": 'Q207006',
  14. "official_api_documentation": 'https://products.wolframalpha.com/api/',
  15. "use_official_api": False,
  16. "require_api_key": False,
  17. "results": 'JSON',
  18. }
  19. # search-url
  20. url = 'https://www.wolframalpha.com/'
  21. search_url = (
  22. url + 'input/json.jsp'
  23. '?async=false'
  24. '&banners=raw'
  25. '&debuggingdata=false'
  26. '&format=image,plaintext,imagemap,minput,moutput'
  27. '&formattimeout=2'
  28. '&{query}'
  29. '&output=JSON'
  30. '&parsetimeout=2'
  31. '&proxycode={token}'
  32. '&scantimeout=0.5'
  33. '&sponsorcategories=true'
  34. '&statemethod=deploybutton'
  35. )
  36. referer_url = url + 'input/?{query}'
  37. # pods to display as image in infobox
  38. # this pods do return a plaintext, but they look better and are more useful as images
  39. image_pods = {'VisualRepresentation', 'Illustration', 'Symbol'}
# Module-level cache handle.  It is only declared here (no value is bound);
# ``init()`` assigns the actual ``EngineCache`` instance.
CACHE: EngineCache
"""Persistent (SQLite) key/value cache that deletes its values after ``expire``
seconds."""
  43. def init(engine_settings):
  44. global CACHE # pylint: disable=global-statement
  45. CACHE = EngineCache(engine_settings["name"]) # type:ignore
  46. def obtain_token() -> str:
  47. token = CACHE.get(key="token")
  48. if token is None:
  49. resp = http_get('https://www.wolframalpha.com/input/api/v1/code?ts=9999999999999999999', timeout=2.0)
  50. token = resp.json()["code"]
  51. # seems, wolframalpha resets its token in every hour
  52. CACHE.set(key="code", value=token, expire=3600)
  53. return token
  54. def request(query, params):
  55. token = obtain_token()
  56. params['url'] = search_url.format(query=urlencode({'input': query}), token=token)
  57. params['headers']['Referer'] = referer_url.format(query=urlencode({'i': query}))
  58. return params
  59. def response(resp):
  60. results = []
  61. resp_json = loads(resp.text)
  62. if not resp_json['queryresult']['success']:
  63. return []
  64. # handle resp_json['queryresult']['assumptions']?
  65. result_chunks = []
  66. infobox_title = ""
  67. result_content = ""
  68. for pod in resp_json['queryresult']['pods']:
  69. pod_id = pod.get('id', '')
  70. pod_title = pod.get('title', '')
  71. pod_is_result = pod.get('primary', None)
  72. if 'subpods' not in pod:
  73. continue
  74. if pod_id == 'Input' or not infobox_title:
  75. infobox_title = pod['subpods'][0]['plaintext']
  76. for subpod in pod['subpods']:
  77. if subpod['plaintext'] != '' and pod_id not in image_pods:
  78. # append unless it's not an actual answer
  79. if subpod['plaintext'] != '(requires interactivity)':
  80. result_chunks.append({'label': pod_title, 'value': subpod['plaintext']})
  81. if pod_is_result or not result_content:
  82. if pod_id != "Input":
  83. result_content = pod_title + ': ' + subpod['plaintext']
  84. elif 'img' in subpod:
  85. result_chunks.append({'label': pod_title, 'image': subpod['img']})
  86. if not result_chunks:
  87. return []
  88. results.append(
  89. {
  90. 'infobox': infobox_title,
  91. 'attributes': result_chunks,
  92. 'urls': [{'title': 'Wolfram|Alpha', 'url': resp.request.headers['Referer']}],
  93. }
  94. )
  95. results.append(
  96. {
  97. 'url': resp.request.headers['Referer'],
  98. 'title': 'Wolfram|Alpha (' + infobox_title + ')',
  99. 'content': result_content,
  100. }
  101. )
  102. return results