wolframalpha_noapi.py 3.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134
  1. # SPDX-License-Identifier: AGPL-3.0-or-later
  2. """
  3. Wolfram|Alpha (Science)
  4. """
  5. from json import loads
  6. from time import time
  7. from urllib.parse import urlencode
  8. from searx.network import get as http_get
  9. # about
  10. about = {
  11. "website": 'https://www.wolframalpha.com/',
  12. "wikidata_id": 'Q207006',
  13. "official_api_documentation": 'https://products.wolframalpha.com/api/',
  14. "use_official_api": False,
  15. "require_api_key": False,
  16. "results": 'JSON',
  17. }
  18. # search-url
  19. url = 'https://www.wolframalpha.com/'
  20. search_url = (
  21. url + 'input/json.jsp'
  22. '?async=false'
  23. '&banners=raw'
  24. '&debuggingdata=false'
  25. '&format=image,plaintext,imagemap,minput,moutput'
  26. '&formattimeout=2'
  27. '&{query}'
  28. '&output=JSON'
  29. '&parsetimeout=2'
  30. '&proxycode={token}'
  31. '&scantimeout=0.5'
  32. '&sponsorcategories=true'
  33. '&statemethod=deploybutton'
  34. )
  35. referer_url = url + 'input/?{query}'
  36. token = {'value': '', 'last_updated': None}
  37. # pods to display as image in infobox
  38. # this pods do return a plaintext, but they look better and are more useful as images
  39. image_pods = {'VisualRepresentation', 'Illustration', 'Symbol'}
  40. # seems, wolframalpha resets its token in every hour
  41. def obtain_token():
  42. update_time = time() - (time() % 3600)
  43. try:
  44. token_response = http_get('https://www.wolframalpha.com/input/api/v1/code?ts=9999999999999999999', timeout=2.0)
  45. token['value'] = loads(token_response.text)['code']
  46. token['last_updated'] = update_time
  47. except: # pylint: disable=bare-except
  48. pass
  49. return token
  50. def init(engine_settings=None): # pylint: disable=unused-argument
  51. obtain_token()
  52. # do search-request
  53. def request(query, params):
  54. # obtain token if last update was more than an hour
  55. if time() - (token['last_updated'] or 0) > 3600:
  56. obtain_token()
  57. params['url'] = search_url.format(query=urlencode({'input': query}), token=token['value'])
  58. params['headers']['Referer'] = referer_url.format(query=urlencode({'i': query}))
  59. return params
  60. # get response from search-request
  61. def response(resp):
  62. results = []
  63. resp_json = loads(resp.text)
  64. if not resp_json['queryresult']['success']:
  65. return []
  66. # handle resp_json['queryresult']['assumptions']?
  67. result_chunks = []
  68. infobox_title = ""
  69. result_content = ""
  70. for pod in resp_json['queryresult']['pods']:
  71. pod_id = pod.get('id', '')
  72. pod_title = pod.get('title', '')
  73. pod_is_result = pod.get('primary', None)
  74. if 'subpods' not in pod:
  75. continue
  76. if pod_id == 'Input' or not infobox_title:
  77. infobox_title = pod['subpods'][0]['plaintext']
  78. for subpod in pod['subpods']:
  79. if subpod['plaintext'] != '' and pod_id not in image_pods:
  80. # append unless it's not an actual answer
  81. if subpod['plaintext'] != '(requires interactivity)':
  82. result_chunks.append({'label': pod_title, 'value': subpod['plaintext']})
  83. if pod_is_result or not result_content:
  84. if pod_id != "Input":
  85. result_content = pod_title + ': ' + subpod['plaintext']
  86. elif 'img' in subpod:
  87. result_chunks.append({'label': pod_title, 'image': subpod['img']})
  88. if not result_chunks:
  89. return []
  90. results.append(
  91. {
  92. 'infobox': infobox_title,
  93. 'attributes': result_chunks,
  94. 'urls': [{'title': 'Wolfram|Alpha', 'url': resp.request.headers['Referer']}],
  95. }
  96. )
  97. results.append(
  98. {
  99. 'url': resp.request.headers['Referer'],
  100. 'title': 'Wolfram|Alpha (' + infobox_title + ')',
  101. 'content': result_content,
  102. }
  103. )
  104. return results