Browse Source

[enh] Add SepiaSearch engine (#2227)

supported_languages values: see https://framagit.org/framasoft/peertube/search-index/-/blob/master/client/src/views/Search.vue#L618-641
Finn 4 years ago
parent
commit
53c8d945b4
2 changed files with 101 additions and 0 deletions
  1. 97 0
      searx/engines/sepiasearch.py
  2. 4 0
      searx/settings.yml

+ 97 - 0
searx/engines/sepiasearch.py

@@ -0,0 +1,97 @@
+# SepiaSearch (Videos)
+#
+# @website     https://sepiasearch.org
+# @provide-api https://framagit.org/framasoft/peertube/search-index/-/tree/master/server/controllers/api
+# @using-api   yes
+# @results     JSON
+# @stable      yes
+# @parse       url, title, content, publishedDate, thumbnail
+
+from json import loads
+from dateutil import parser, relativedelta
+from urllib.parse import urlencode
+from datetime import datetime
+
+categories = ['videos']
+paging = True
+language_support = True
+time_range_support = True
+safesearch = True
+supported_languages = [
+    'en', 'fr', 'ja', 'eu', 'ca', 'cs', 'eo', 'el',
+    'de', 'it', 'nl', 'es', 'oc', 'gd', 'zh', 'pt',
+    'sv', 'pl', 'fi', 'ru'
+]
+base_url = 'https://sepiasearch.org/api/v1/search/videos'
+
+safesearch_table = {
+    0: 'both',
+    1: 'false',
+    2: 'false'
+}
+
+time_range_table = {
+    'day': relativedelta.relativedelta(),
+    'week': relativedelta.relativedelta(weeks=-1),
+    'month': relativedelta.relativedelta(months=-1),
+    'year': relativedelta.relativedelta(years=-1)
+}
+
+
+embedded_url = '<iframe width="540" height="304" src="{url}" frameborder="0" allowfullscreen></iframe>'
+
+
+def minute_to_hm(minute):
+    if isinstance(minute, int):
+        return "%d:%02d" % (divmod(minute, 60))
+    return None
+
+
+def request(query, params):
+    params['url'] = base_url + '?' + urlencode({
+        'search': query,
+        'start': (params['pageno'] - 1) * 10,
+        'count': 10,
+        'sort': '-match',
+        'nsfw': safesearch_table[params['safesearch']]
+    })
+
+    language = params['language'].split('-')[0]
+    if language in supported_languages:
+        params['url'] += '&languageOneOf[]=' + language
+    if params['time_range'] in time_range_table:
+        time = datetime.now().date() + time_range_table[params['time_range']]
+        params['url'] += '&startDate=' + time.isoformat()
+
+    return params
+
+
+def response(resp):
+    results = []
+
+    search_results = loads(resp.text)
+
+    if 'data' not in search_results:
+        return []
+
+    for result in search_results['data']:
+        title = result['name']
+        content = result['description']
+        thumbnail = result['thumbnailUrl']
+        publishedDate = parser.parse(result['publishedAt'])
+        embedded = embedded_url.format(url=result.get('embedUrl'))
+        author = result.get('account', {}).get('displayName')
+        length = minute_to_hm(result.get('duration'))
+        url = result['url']
+
+        results.append({'url': url,
+                        'title': title,
+                        'content': content,
+                        'author': author,
+                        'length': length,
+                        'template': 'videos.html',
+                        'publishedDate': publishedDate,
+                        'embedded': embedded,
+                        'thumbnail': thumbnail})
+
+    return results

+ 4 - 0
searx/settings.yml

@@ -600,6 +600,10 @@ engines:
 #    engine : scanr_structures
 #    disabled : True
 
+  - name: sepiasearch
+    engine: sepiasearch
+    shortcut: sep
+
   - name : soundcloud
     engine : soundcloud
     shortcut : sc