google_play_apps.py 2.1 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970
# SPDX-License-Identifier: AGPL-3.0-or-later
"""
Google Play Apps
"""
  5. from urllib.parse import urlencode
  6. from lxml import html
  7. from searx.utils import (
  8. eval_xpath,
  9. extract_url,
  10. extract_text,
  11. eval_xpath_list,
  12. eval_xpath_getindex,
  13. )
  14. about = {
  15. "website": "https://play.google.com/",
  16. "wikidata_id": "Q79576",
  17. "use_official_api": False,
  18. "require_api_key": False,
  19. "results": "HTML",
  20. }
  21. categories = ["files", "apps"]
  22. search_url = "https://play.google.com/store/search?{query}&c=apps&ucbcb=1"
  23. def request(query, params):
  24. params["url"] = search_url.format(query=urlencode({"q": query}))
  25. params['cookies']['CONSENT'] = "YES+"
  26. return params
  27. def response(resp):
  28. results = []
  29. dom = html.fromstring(resp.text)
  30. if eval_xpath(dom, '//div[@class="v6DsQb"]'):
  31. return []
  32. spot = eval_xpath_getindex(dom, '//div[@class="ipRz4"]', 0, None)
  33. if spot is not None:
  34. url = extract_url(eval_xpath(spot, './a[@class="Qfxief"]/@href'), search_url)
  35. title = extract_text(eval_xpath(spot, './/div[@class="vWM94c"]'))
  36. content = extract_text(eval_xpath(spot, './/div[@class="LbQbAe"]'))
  37. img = extract_text(eval_xpath(spot, './/img[@class="T75of bzqKMd"]/@src'))
  38. results.append({"url": url, "title": title, "content": content, "img_src": img})
  39. more = eval_xpath_list(dom, '//c-wiz[@jsrenderer="RBsfwb"]//div[@role="listitem"]', min_len=1)
  40. for result in more:
  41. url = extract_url(eval_xpath(result, ".//a/@href"), search_url)
  42. title = extract_text(eval_xpath(result, './/span[@class="DdYX5"]'))
  43. content = extract_text(eval_xpath(result, './/span[@class="wMUdtb"]'))
  44. img = extract_text(
  45. eval_xpath(
  46. result,
  47. './/img[@class="T75of stzEZd" or @class="T75of etjhNc Q8CSx "]/@src',
  48. )
  49. )
  50. results.append({"url": url, "title": title, "content": content, "img_src": img})
  51. for suggestion in eval_xpath_list(dom, '//c-wiz[@jsrenderer="qyd4Kb"]//div[@class="ULeU3b neq64b"]'):
  52. results.append({"suggestion": extract_text(eval_xpath(suggestion, './/div[@class="Epkrse "]'))})
  53. return results