solidtorrents.py 2.2 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485
  1. # SPDX-License-Identifier: AGPL-3.0-or-later
  2. # lint: pylint
  3. """SolidTorrents
  4. """
  5. from datetime import datetime
  6. from urllib.parse import urlencode
  7. import random
  8. from lxml import html
  9. from searx.utils import extract_text, eval_xpath, eval_xpath_getindex
  10. about = {
  11. "website": 'https://www.solidtorrents.net/',
  12. "wikidata_id": None,
  13. "official_api_documentation": None,
  14. "use_official_api": False,
  15. "require_api_key": False,
  16. "results": 'HTML',
  17. }
  18. categories = ['files']
  19. paging = True
  20. base_url = ''
  21. base_url_rand = ''
  22. units = {"B": 1, "KB": 2 ** 10, "MB": 2 ** 20, "GB": 2 ** 30, "TB": 2 ** 40}
  23. def size2int(size_str):
  24. n, u = size_str.split()
  25. return int(float(n.strip()) * units[u.strip()])
  26. def request(query, params):
  27. global base_url_rand # pylint: disable=global-statement
  28. if isinstance(base_url, list):
  29. base_url_rand = random.choice(base_url)
  30. else:
  31. base_url_rand = base_url
  32. search_url = base_url_rand + '/search?{query}'
  33. page = (params['pageno'] - 1) * 20
  34. query = urlencode({'q': query, 'page': page})
  35. params['url'] = search_url.format(query=query)
  36. return params
  37. def response(resp):
  38. results = []
  39. dom = html.fromstring(resp.text)
  40. for result in eval_xpath(dom, '//div[contains(@class, "search-result")]'):
  41. a = eval_xpath_getindex(result, './div/h5/a', 0, None)
  42. if a is None:
  43. continue
  44. title = extract_text(a)
  45. url = eval_xpath_getindex(a, '@href', 0, None)
  46. stats = eval_xpath(result, './div//div[contains(@class, "stats")]/div')
  47. filesize = size2int(extract_text(stats[1]))
  48. leech = extract_text(stats[2])
  49. seed = extract_text(stats[3])
  50. magnet = eval_xpath_getindex(result, './div//a[contains(@class, "dl-magnet")]/@href', 0, None)
  51. params = {
  52. 'seed': seed,
  53. 'leech': leech,
  54. 'title': title,
  55. 'url': base_url_rand + url,
  56. 'filesize': filesize,
  57. 'magnetlink': magnet,
  58. 'template': "torrent.html",
  59. }
  60. date_str = extract_text(stats[4])
  61. try:
  62. params['publishedDate'] = datetime.strptime(date_str, '%b %d, %Y')
  63. except ValueError:
  64. pass
  65. results.append(params)
  66. return results