peertube.py 3.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101
  1. # SPDX-License-Identifier: AGPL-3.0-or-later
  2. """
  3. peertube (Videos)
  4. """
  5. from json import loads
  6. from datetime import datetime
  7. from urllib.parse import urlencode
  8. from searx.utils import html_to_text
  9. # about
  10. about = {
  11. "website": 'https://joinpeertube.org',
  12. "wikidata_id": 'Q50938515',
  13. "official_api_documentation": 'https://docs.joinpeertube.org/api-rest-reference.html',
  14. "use_official_api": True,
  15. "require_api_key": False,
  16. "results": 'JSON',
  17. }
  18. # engine dependent config
  19. categories = ["videos"]
  20. paging = True
  21. base_url = "https://peer.tube"
  22. supported_languages_url = (
  23. 'https://framagit.org/framasoft/peertube/search-index/-/raw/master/client/src/views/Search.vue'
  24. )
  25. # do search-request
  26. def request(query, params):
  27. sanitized_url = base_url.rstrip("/")
  28. pageno = (params["pageno"] - 1) * 15
  29. search_url = sanitized_url + "/api/v1/search/videos/?pageno={pageno}&{query}"
  30. query_dict = {"search": query}
  31. language = params["language"].split("-")[0]
  32. if "all" != language and language in supported_languages:
  33. query_dict["languageOneOf"] = language
  34. params["url"] = search_url.format(
  35. query=urlencode(query_dict), pageno=pageno
  36. )
  37. return params
  38. def _get_offset_from_pageno(pageno):
  39. return (pageno - 1) * 15 + 1
  40. # get response from search-request
  41. def response(resp):
  42. sanitized_url = base_url.rstrip("/")
  43. results = []
  44. search_res = loads(resp.text)
  45. embedded_url = (
  46. '<iframe width="560" height="315" sandbox="allow-same-origin allow-scripts allow-popups" '
  47. + 'src="'
  48. + sanitized_url
  49. + '{embed_path}" frameborder="0" allowfullscreen></iframe>'
  50. )
  51. # return empty array if there are no results
  52. if "data" not in search_res:
  53. return []
  54. # parse results
  55. for res in search_res["data"]:
  56. title = res["name"]
  57. url = sanitized_url + "/videos/watch/" + res["uuid"]
  58. description = res["description"]
  59. if description:
  60. content = html_to_text(res["description"])
  61. else:
  62. content = ""
  63. thumbnail = sanitized_url + res["thumbnailPath"]
  64. publishedDate = datetime.strptime(res["publishedAt"], "%Y-%m-%dT%H:%M:%S.%fZ")
  65. embedded = embedded_url.format(embed_path=res["embedPath"])
  66. results.append(
  67. {
  68. "template": "videos.html",
  69. "url": url,
  70. "title": title,
  71. "content": content,
  72. "publishedDate": publishedDate,
  73. "embedded": embedded,
  74. "thumbnail": thumbnail,
  75. }
  76. )
  77. # return results
  78. return results
  79. def _fetch_supported_languages(resp):
  80. import re
  81. # https://docs.python.org/3/howto/regex.html#greedy-versus-non-greedy
  82. videolanguages = re.search(r"videoLanguages \(\)[^\n]+(.*?)\]", resp.text, re.DOTALL)
  83. peertube_languages = [m.group(1) for m in re.finditer(r"\{ id: '([a-z]+)', label:", videolanguages.group(1))]
  84. return peertube_languages