torrentz.py 2.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100
  1. # SPDX-License-Identifier: AGPL-3.0-or-later
  2. """
  3. Torrentz2.is (BitTorrent meta-search engine)
  4. """
  5. import re
  6. from urllib.parse import urlencode
  7. from lxml import html
  8. from datetime import datetime
  9. from searx.utils import extract_text, get_torrent_size
  10. # about
  11. about = {
  12. "website": 'https://torrentz2.is/',
  13. "wikidata_id": 'Q1156687',
  14. "official_api_documentation": 'https://torrentz.is/torrentz.btsearch',
  15. "use_official_api": False,
  16. "require_api_key": False,
  17. "results": 'HTML',
  18. }
  19. # engine dependent config
  20. categories = ['files', 'videos', 'music']
  21. paging = True
  22. # search-url
  23. # https://torrentz2.is/search?f=EXAMPLE&p=6
  24. base_url = 'https://torrentz2.is/'
  25. search_url = base_url + 'search?{query}'
  26. # do search-request
  27. def request(query, params):
  28. page = params['pageno'] - 1
  29. query = urlencode({'f': query, 'p': page})
  30. params['url'] = search_url.format(query=query)
  31. return params
  32. # get response from search-request
  33. def response(resp):
  34. results = []
  35. dom = html.fromstring(resp.text)
  36. for result in dom.xpath('//div[@class="results"]/dl'):
  37. name_cell = result.xpath('./dt')[0]
  38. title = extract_text(name_cell)
  39. # skip rows that do not contain a link to a torrent
  40. links = name_cell.xpath('./a')
  41. if len(links) != 1:
  42. continue
  43. # extract url and remove a slash in the beginning
  44. link = links[0].attrib.get('href').lstrip('/')
  45. seed = 0
  46. leech = 0
  47. try:
  48. seed = int(result.xpath('./dd/span[4]/text()')[0].replace(',', ''))
  49. leech = int(result.xpath('./dd/span[5]/text()')[0].replace(',', ''))
  50. except:
  51. pass
  52. params = {
  53. 'url': base_url + link,
  54. 'title': title,
  55. 'seed': seed,
  56. 'leech': leech,
  57. 'template': 'torrent.html'
  58. }
  59. # let's try to calculate the torrent size
  60. try:
  61. filesize_info = result.xpath('./dd/span[3]/text()')[0]
  62. filesize, filesize_multiplier = filesize_info.split()
  63. filesize = get_torrent_size(filesize, filesize_multiplier)
  64. params['filesize'] = filesize
  65. except:
  66. pass
  67. # does our link contain a valid SHA1 sum?
  68. if re.compile('[0-9a-fA-F]{40}').match(link):
  69. # add a magnet link to the result
  70. params['magnetlink'] = 'magnet:?xt=urn:btih:' + link
  71. # extract and convert creation date
  72. try:
  73. date_ts = result.xpath('./dd/span[2]')[0].attrib.get('title')
  74. date = datetime.fromtimestamp(float(date_ts))
  75. params['publishedDate'] = date
  76. except:
  77. pass
  78. results.append(params)
  79. return results