yep.py 2.0 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980
  1. # SPDX-License-Identifier: AGPL-3.0-or-later
  2. """Yep (general, images, news)
  3. """
  4. from datetime import datetime
  5. from urllib.parse import urlencode
  6. from searx.utils import html_to_text
  7. about = {
  8. 'website': 'https://yep.com/',
  9. 'official_api_documentation': 'https://docs.developer.yelp.com',
  10. 'use_official_api': False,
  11. 'require_api_key': False,
  12. 'results': 'JSON',
  13. }
  14. base_url = "https://api.yep.com"
  15. search_type = "web" # 'web', 'images', 'news'
  16. safesearch = True
  17. safesearch_map = {0: 'off', 1: 'moderate', 2: 'strict'}
  18. def request(query, params):
  19. args = {
  20. 'client': 'web',
  21. 'no_correct': 'false',
  22. 'q': query,
  23. 'safeSearch': safesearch_map[params['safesearch']],
  24. 'type': search_type,
  25. }
  26. params['url'] = f"{base_url}/fs/2/search?{urlencode(args)}"
  27. params['headers']['Referer'] = 'https://yep.com/'
  28. return params
  29. def _web_result(result):
  30. return {
  31. 'url': result['url'],
  32. 'title': result['title'],
  33. 'content': html_to_text(result['snippet']),
  34. }
  35. def _images_result(result):
  36. return {
  37. 'template': 'images.html',
  38. 'url': result['host_page'],
  39. 'title': result.get('title', ''),
  40. 'content': '',
  41. 'img_src': result['image_id'],
  42. 'thumbnail_src': result['src'],
  43. }
  44. def _news_result(result):
  45. return {
  46. 'url': result['url'],
  47. 'title': result['title'],
  48. 'content': html_to_text(result['snippet']),
  49. 'publishedDate': datetime.strptime(result['first_seen'][:19], '%Y-%m-%dT%H:%M:%S'),
  50. }
  51. def response(resp):
  52. results = []
  53. for result in resp.json()[1]['results']:
  54. if search_type == "web":
  55. if result['type'] != 'Organic':
  56. continue
  57. results.append(_web_result(result))
  58. elif search_type == "images":
  59. results.append(_images_result(result))
  60. elif search_type == "news":
  61. results.append(_news_result(result))
  62. else:
  63. raise ValueError(f"Unsupported yep search type: {search_type}")
  64. return results