1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980 |
- # SPDX-License-Identifier: AGPL-3.0-or-later
- """Yep (general, images, news)
- """
- from datetime import datetime
- from urllib.parse import urlencode
- from searx.utils import html_to_text
- about = {
- 'website': 'https://yep.com/',
- 'official_api_documentation': 'https://docs.developer.yelp.com',
- 'use_official_api': False,
- 'require_api_key': False,
- 'results': 'JSON',
- }
- base_url = "https://api.yep.com"
- search_type = "web" # 'web', 'images', 'news'
- safesearch = True
- safesearch_map = {0: 'off', 1: 'moderate', 2: 'strict'}
- def request(query, params):
- args = {
- 'client': 'web',
- 'no_correct': 'false',
- 'q': query,
- 'safeSearch': safesearch_map[params['safesearch']],
- 'type': search_type,
- }
- params['url'] = f"{base_url}/fs/2/search?{urlencode(args)}"
- params['headers']['Referer'] = 'https://yep.com/'
- return params
- def _web_result(result):
- return {
- 'url': result['url'],
- 'title': result['title'],
- 'content': html_to_text(result['snippet']),
- }
- def _images_result(result):
- return {
- 'template': 'images.html',
- 'url': result['host_page'],
- 'title': result.get('title', ''),
- 'content': '',
- 'img_src': result['image_id'],
- 'thumbnail_src': result['src'],
- }
- def _news_result(result):
- return {
- 'url': result['url'],
- 'title': result['title'],
- 'content': html_to_text(result['snippet']),
- 'publishedDate': datetime.strptime(result['first_seen'][:19], '%Y-%m-%dT%H:%M:%S'),
- }
- def response(resp):
- results = []
- for result in resp.json()[1]['results']:
- if search_type == "web":
- if result['type'] != 'Organic':
- continue
- results.append(_web_result(result))
- elif search_type == "images":
- results.append(_images_result(result))
- elif search_type == "news":
- results.append(_news_result(result))
- else:
- raise ValueError(f"Unsupported yep search type: {search_type}")
- return results
|