rumble.py 2.7 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182
  1. # SPDX-License-Identifier: AGPL-3.0-or-later
  2. """
  3. Rumble (Videos)
  4. """
  5. from urllib.parse import urlencode
  6. from lxml import html
  7. from datetime import datetime
  8. # about
  9. from searx.utils import extract_text
  10. about = {
  11. "website": 'https://rumble.com/',
  12. "wikidata_id": 'Q104765127',
  13. "official_api_documentation": 'https://help.rumble.com/',
  14. "use_official_api": False,
  15. "require_api_key": False,
  16. "results": 'HTML',
  17. }
  18. # engine dependent config
  19. categories = ['videos']
  20. paging = True
  21. # search-url
  22. base_url = 'https://rumble.com'
  23. # https://rumble.com/search/video?q=searx&page=3
  24. search_url = base_url + '/search/video?{query}&page={pageno}'
  25. url_xpath = './/a[@class="video-item--a"]/@href'
  26. thumbnail_xpath = './/img[@class="video-item--img"]/@src'
  27. title_xpath = './/h3[@class="video-item--title"]'
  28. published_date = './/time[@class="video-item--meta video-item--time"]/@datetime'
  29. earned_xpath = './/span[@class="video-item--meta video-item--earned"]/@data-value'
  30. views_xpath = './/span[@class="video-item--meta video-item--views"]/@data-value'
  31. rumbles_xpath = './/span[@class="video-item--meta video-item--rumbles"]/@data-value'
  32. author_xpath = './/div[@class="ellipsis-1"]'
  33. length_xpath = './/span[@class="video-item--duration"]/@data-value'
  34. def request(query, params):
  35. params['url'] = search_url.format(pageno=params['pageno'], query=urlencode({'q': query}))
  36. return params
  37. def response(resp):
  38. results = []
  39. dom = html.fromstring(resp.text)
  40. results_dom = dom.xpath('//li[contains(@class, "video-listing-entry")]')
  41. if not results_dom:
  42. return []
  43. for result_dom in results_dom:
  44. url = base_url + extract_text(result_dom.xpath(url_xpath))
  45. thumbnail = extract_text(result_dom.xpath(thumbnail_xpath))
  46. title = extract_text(result_dom.xpath(title_xpath))
  47. p_date = extract_text(result_dom.xpath(published_date))
  48. # fix offset date for line 644 webapp.py check
  49. fixed_date = datetime.strptime(p_date, '%Y-%m-%dT%H:%M:%S%z')
  50. earned = extract_text(result_dom.xpath(earned_xpath))
  51. views = extract_text(result_dom.xpath(views_xpath))
  52. rumbles = extract_text(result_dom.xpath(rumbles_xpath))
  53. author = extract_text(result_dom.xpath(author_xpath))
  54. length = extract_text(result_dom.xpath(length_xpath))
  55. if earned:
  56. content = f"{views} views - {rumbles} rumbles - ${earned}"
  57. else:
  58. content = f"{views} views - {rumbles} rumbles"
  59. results.append({
  60. 'url': url,
  61. 'title': title,
  62. 'content': content,
  63. 'author': author,
  64. 'length': length,
  65. 'template': 'videos.html',
  66. 'publishedDate': fixed_date,
  67. 'thumbnail': thumbnail,
  68. })
  69. return results