unsplash.py 1.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869
  1. # SPDX-License-Identifier: AGPL-3.0-or-later
  2. # lint: pylint
  3. # pylint: disable=missing-function-docstring
  4. """Unsplash
  5. """
  6. from urllib.parse import urlencode, urlparse, urlunparse, parse_qsl
  7. from json import loads
  8. from searx import logger
  9. logger = logger.getChild('unsplash engine')
  10. # about
  11. about = {
  12. "website": 'https://unsplash.com',
  13. "wikidata_id": 'Q28233552',
  14. "official_api_documentation": 'https://unsplash.com/developers',
  15. "use_official_api": False,
  16. "require_api_key": False,
  17. "results": 'JSON',
  18. }
  19. base_url = 'https://unsplash.com/'
  20. search_url = base_url + 'napi/search/photos?'
  21. categories = ['images']
  22. page_size = 20
  23. paging = True
  24. def clean_url(url):
  25. parsed = urlparse(url)
  26. query = [(k, v) for (k, v)
  27. in parse_qsl(parsed.query) if k not in ['ixid', 's']]
  28. return urlunparse((
  29. parsed.scheme,
  30. parsed.netloc,
  31. parsed.path,
  32. parsed.params,
  33. urlencode(query),
  34. parsed.fragment
  35. ))
  36. def request(query, params):
  37. params['url'] = search_url + urlencode({
  38. 'query': query, 'page': params['pageno'], 'per_page': page_size
  39. })
  40. logger.debug("query_url --> %s", params['url'])
  41. return params
  42. def response(resp):
  43. results = []
  44. json_data = loads(resp.text)
  45. if 'results' in json_data:
  46. for result in json_data['results']:
  47. results.append({
  48. 'template': 'images.html',
  49. 'url': clean_url(result['links']['html']),
  50. 'thumbnail_src': clean_url(result['urls']['thumb']),
  51. 'img_src': clean_url(result['urls']['raw']),
  52. 'title': result.get('alt_description') or 'unknown',
  53. 'content': result.get('description') or ''
  54. })
  55. return results