
Merge pull request #2460 from dalf/engine-about

[enh] engines: add about variable
Alexandre Flament, 4 years ago
commit 1d13ad8452
90 changed files with 1421 additions and 725 deletions
  1. searx/engines/1337x.py (+14 -0)
  2. searx/engines/acgsou.py (+11 -7)
  3. searx/engines/ahmia.py (+11 -8)
  4. searx/engines/apkmirror.py (+10 -7)
  5. searx/engines/archlinux.py (+12 -8)
  6. searx/engines/arxiv.py (+10 -9)
  7. searx/engines/base.py (+10 -11)
  8. searx/engines/bing.py (+11 -11)
  9. searx/engines/bing_images.py (+11 -10)
  10. searx/engines/bing_news.py (+11 -9)
  11. searx/engines/bing_videos.py (+11 -8)
  12. searx/engines/btdigg.py (+14 -8)
  13. searx/engines/command.py (+4 -15)
  14. searx/engines/currency_convert.py (+14 -0)
  15. searx/engines/dailymotion.py (+11 -10)
  16. searx/engines/deezer.py (+11 -8)
  17. searx/engines/deviantart.py (+11 -10)
  18. searx/engines/dictzone.py (+10 -7)
  19. searx/engines/digbt.py (+10 -8)
  20. searx/engines/digg.py (+11 -8)
  21. searx/engines/doku.py (+14 -10)
  22. searx/engines/duckduckgo.py (+11 -11)
  23. searx/engines/duckduckgo_definitions.py (+12 -8)
  24. searx/engines/duckduckgo_images.py (+14 -11)
  25. searx/engines/duden.py (+11 -6)
  26. searx/engines/dummy-offline.py (+11 -3)
  27. searx/engines/dummy.py (+11 -3)
  28. searx/engines/ebay.py (+14 -9)
  29. searx/engines/elasticsearch.py (+5 -0)
  30. searx/engines/etools.py (+11 -7)
  31. searx/engines/fdroid.py (+11 -7)
  32. searx/engines/flickr.py (+11 -9)
  33. searx/engines/flickr_noapi.py (+12 -11)
  34. searx/engines/framalibre.py (+11 -8)
  35. searx/engines/frinkiac.py (+15 -8)
  36. searx/engines/genius.py (+12 -9)
  37. searx/engines/gentoo.py (+11 -9)
  38. searx/engines/gigablast.py (+10 -8)
  39. searx/engines/github.py (+12 -9)
  40. searx/engines/google.py (+14 -12)
  41. searx/engines/google_images.py (+10 -12)
  42. searx/engines/google_news.py (+11 -8)
  43. searx/engines/google_videos.py (+11 -8)
  44. searx/engines/ina.py (+13 -12)
  45. searx/engines/invidious.py (+14 -9)
  46. searx/engines/json_engine.py (+2 -0)
  47. searx/engines/kickass.py (+11 -8)
  48. searx/engines/mediawiki.py (+12 -11)
  49. searx/engines/microsoft_academic.py (+12 -8)
  50. searx/engines/mixcloud.py (+11 -8)
  51. searx/engines/not_evil.py (+11 -8)
  52. searx/engines/nyaa.py (+11 -7)
  53. searx/engines/opensemantic.py (+13 -9)
  54. searx/engines/openstreetmap.py (+11 -8)
  55. searx/engines/pdbe.py (+11 -8)
  56. searx/engines/peertube.py (+11 -10)
  57. searx/engines/photon.py (+11 -8)
  58. searx/engines/piratebay.py (+14 -9)
  59. searx/engines/pubmed.py (+13 -9)
  60. searx/engines/qwant.py (+10 -8)
  61. searx/engines/recoll.py (+11 -6)
  62. searx/engines/reddit.py (+11 -8)
  63. searx/engines/scanr_structures.py (+11 -8)
  64. searx/engines/searchcode_code.py (+11 -9)
  65. searx/engines/searx_engine.py (+10 -8)
  66. searx/engines/sepiasearch.py (+14 -8)
  67. searx/engines/soundcloud.py (+10 -8)
  68. searx/engines/spotify.py (+11 -8)
  69. searx/engines/stackoverflow.py (+12 -9)
  70. searx/engines/startpage.py (+14 -11)
  71. searx/engines/tokyotoshokan.py (+11 -8)
  72. searx/engines/torrentz.py (+11 -9)
  73. searx/engines/translated.py (+11 -7)
  74. searx/engines/unsplash.py (+11 -8)
  75. searx/engines/vimeo.py (+14 -13)
  76. searx/engines/wikidata.py (+11 -9)
  77. searx/engines/wikipedia.py (+11 -8)
  78. searx/engines/wolframalpha_api.py (+14 -9)
  79. searx/engines/wolframalpha_noapi.py (+14 -9)
  80. searx/engines/www1x.py (+11 -8)
  81. searx/engines/xpath.py (+2 -0)
  82. searx/engines/yacy.py (+14 -13)
  83. searx/engines/yahoo.py (+11 -9)
  84. searx/engines/yahoo_news.py (+14 -10)
  85. searx/engines/yandex.py (+11 -7)
  86. searx/engines/yggtorrent.py (+14 -9)
  87. searx/engines/youtube_api.py (+14 -9)
  88. searx/engines/youtube_noapi.py (+14 -9)
  89. searx/settings.yml (+213 -0)
  90. utils/fetch_engine_descriptions.py (+206 -0)
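The diffs below all follow the same pattern: each engine module drops its old `@website` / `@provide-api` / `@using-api` / `@results` / `@stable` / `@parse` docstring tags and instead declares a module-level `about` dictionary, so the metadata becomes machine-readable. A minimal sketch of the new convention for a hypothetical engine module (the field values are illustrative placeholders, not taken from the diff):

    # SPDX-License-Identifier: AGPL-3.0-or-later
    """
     Example engine
    """

    # about: machine-readable metadata replacing the old docstring tags
    about = {
        "website": 'https://example.org/',     # public site of the engine
        "wikidata_id": None,                   # Wikidata item ID, or None if unknown
        "official_api_documentation": None,    # URL of the API docs, or None
        "use_official_api": False,             # True if results come from an official API
        "require_api_key": False,              # True if an API key must be configured
        "results": 'HTML',                     # format the result parser consumes
    }

Where a plain URL is not enough, `official_api_documentation` may instead be a small dict with `url` and `comment` keys, as the btdigg, duckduckgo_images, and frinkiac diffs below show.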

+ 14 - 0
searx/engines/1337x.py

@@ -1,7 +1,21 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
+"""
+ 1337x
+"""
+
 from urllib.parse import quote, urljoin
 from lxml import html
 from searx.utils import extract_text, get_torrent_size, eval_xpath, eval_xpath_list, eval_xpath_getindex
+# about
+about = {
+    "website": 'https://1337x.to/',
+    "wikidata_id": 'Q28134166',
+    "official_api_documentation": None,
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}

 url = 'https://1337x.to/'
 search_url = url + 'search/{search_term}/{pageno}/'

+ 11 - 7
searx/engines/acgsou.py

@@ -1,18 +1,22 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Acgsou (Japanese Animation/Music/Comics Bittorrent tracker)
  Acgsou (Japanese Animation/Music/Comics Bittorrent tracker)
-
- @website      https://www.acgsou.com/
- @provide-api  no
- @using-api    no
- @results      HTML
- @stable       no (HTML can change)
- @parse        url, title, content, seed, leech, torrentfile
 """
 """
 
 
 from urllib.parse import urlencode
 from urllib.parse import urlencode
 from lxml import html
 from lxml import html
 from searx.utils import extract_text, get_torrent_size, eval_xpath_list, eval_xpath_getindex
 from searx.utils import extract_text, get_torrent_size, eval_xpath_list, eval_xpath_getindex
 
 
+# about
+about = {
+    "website": 'https://www.acgsou.com/',
+    "wikidata_id": None,
+    "official_api_documentation": None,
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 # engine dependent config
 categories = ['files', 'images', 'videos', 'music']
 paging = True

+ 11 - 8
searx/engines/ahmia.py

@@ -1,19 +1,22 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Ahmia (Onions)
  Ahmia (Onions)
-
- @website      http://msydqstlz2kzerdg.onion
- @provides-api no
-
- @using-api    no
- @results      HTML
- @stable       no
- @parse        url, title, content
 """
 """
 
 
 from urllib.parse import urlencode, urlparse, parse_qs
 from urllib.parse import urlencode, urlparse, parse_qs
 from lxml.html import fromstring
 from lxml.html import fromstring
 from searx.engines.xpath import extract_url, extract_text, eval_xpath_list, eval_xpath
 from searx.engines.xpath import extract_url, extract_text, eval_xpath_list, eval_xpath
 
 
+# about
+about = {
+    "website": 'http://msydqstlz2kzerdg.onion',
+    "wikidata_id": 'Q18693938',
+    "official_api_documentation": None,
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 # engine config
 categories = ['onions']
 paging = True

+ 10 - 7
searx/engines/apkmirror.py

@@ -1,18 +1,21 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  APK Mirror
  APK Mirror
-
- @website     https://www.apkmirror.com
-
- @using-api   no
- @results     HTML
- @stable      no (HTML can change)
- @parse       url, title, thumbnail_src
 """
 """
 
 
 from urllib.parse import urlencode
 from urllib.parse import urlencode
 from lxml import html
 from lxml import html
 from searx.utils import extract_text, eval_xpath_list, eval_xpath_getindex
 from searx.utils import extract_text, eval_xpath_list, eval_xpath_getindex
 
 
+# about
+about = {
+    "website": 'https://www.apkmirror.com',
+    "wikidata_id": None,
+    "official_api_documentation": None,
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}

 # engine dependent config
 categories = ['it']

+ 12 - 8
searx/engines/archlinux.py

@@ -1,20 +1,24 @@
-# -*- coding: utf-8 -*-
-
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Arch Linux Wiki
  Arch Linux Wiki
 
 
- @website      https://wiki.archlinux.org
- @provide-api  no (Mediawiki provides API, but Arch Wiki blocks access to it
- @using-api    no
- @results      HTML
- @stable       no (HTML can change)
- @parse        url, title
+ API: Mediawiki provides API, but Arch Wiki blocks access to it
 """
 """
 
 
 from urllib.parse import urlencode, urljoin
 from urllib.parse import urlencode, urljoin
 from lxml import html
 from lxml import html
 from searx.utils import extract_text, eval_xpath_list, eval_xpath_getindex
 from searx.utils import extract_text, eval_xpath_list, eval_xpath_getindex
 
 
+# about
+about = {
+    "website": 'https://wiki.archlinux.org/',
+    "wikidata_id": 'Q101445877',
+    "official_api_documentation": None,
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 # engine dependent config
 categories = ['it']
 language_support = True

+ 10 - 9
searx/engines/arxiv.py

@@ -1,20 +1,21 @@
-#!/usr/bin/env python
-
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  ArXiV (Scientific preprints)
  ArXiV (Scientific preprints)
- @website     https://arxiv.org
- @provide-api yes (export.arxiv.org/api/query)
- @using-api   yes
- @results     XML-RSS
- @stable      yes
- @parse       url, title, publishedDate, content
- More info on api: https://arxiv.org/help/api/user-manual
 """
 """
 
 
 from lxml import html
 from lxml import html
 from datetime import datetime
 from datetime import datetime
 from searx.utils import eval_xpath_list, eval_xpath_getindex
 from searx.utils import eval_xpath_list, eval_xpath_getindex
 
 
+# about
+about = {
+    "website": 'https://arxiv.org',
+    "wikidata_id": 'Q118398',
+    "official_api_documentation": 'https://arxiv.org/help/api',
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'XML-RSS',
+}

 categories = ['science']
 paging = True

+ 10 - 11
searx/engines/base.py

@@ -1,16 +1,6 @@
-#!/usr/bin/env python
-
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  BASE (Scholar publications)
  BASE (Scholar publications)
-
- @website     https://base-search.net
- @provide-api yes with authorization (https://api.base-search.net/)
-
- @using-api   yes
- @results     XML
- @stable      ?
- @parse       url, title, publishedDate, content
- More info on api: http://base-search.net/about/download/base_interface.pdf
 """
 """
 
 
 from urllib.parse import urlencode
 from urllib.parse import urlencode
@@ -19,6 +9,15 @@ from datetime import datetime
 import re
 from searx.utils import searx_useragent
+# about
+about = {
+    "website": 'https://base-search.net',
+    "wikidata_id": 'Q448335',
+    "official_api_documentation": 'https://api.base-search.net/',
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'XML',
+}

 categories = ['science']

+ 11 - 11
searx/engines/bing.py

@@ -1,16 +1,6 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Bing (Web)
  Bing (Web)
-
- @website     https://www.bing.com
- @provide-api yes (http://datamarket.azure.com/dataset/bing/search),
-              max. 5000 query/month
-
- @using-api   no (because of query limit)
- @results     HTML (using search portal)
- @stable      no (HTML can change)
- @parse       url, title, content
-
- @todo        publishedDate
 """
 """
 
 
 import re
 import re
@@ -21,6 +11,16 @@ from searx.utils import eval_xpath, extract_text, match_language
 
 
 logger = logger.getChild('bing engine')
 logger = logger.getChild('bing engine')
 
 
+# about
+about = {
+    "website": 'https://www.bing.com',
+    "wikidata_id": 'Q182496',
+    "official_api_documentation": 'https://www.microsoft.com/en-us/bing/apis/bing-web-search-api',
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 # engine dependent config
 categories = ['general']
 paging = True

+ 11 - 10
searx/engines/bing_images.py

@@ -1,15 +1,6 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Bing (Images)
  Bing (Images)
-
- @website     https://www.bing.com/images
- @provide-api yes (http://datamarket.azure.com/dataset/bing/search),
-              max. 5000 query/month
-
- @using-api   no (because of query limit)
- @results     HTML (using search portal)
- @stable      no (HTML can change)
- @parse       url, title, img_src
-
 """
 """
 
 
 from urllib.parse import urlencode
 from urllib.parse import urlencode
@@ -20,6 +11,16 @@ from searx.utils import match_language
 from searx.engines.bing import language_aliases
 from searx.engines.bing import _fetch_supported_languages, supported_languages_url  # NOQA # pylint: disable=unused-import
+# about
+about = {
+    "website": 'https://www.bing.com/images',
+    "wikidata_id": 'Q182496',
+    "official_api_documentation": 'https://www.microsoft.com/en-us/bing/apis/bing-image-search-api',
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 # engine dependent config
 categories = ['images']
 paging = True

+ 11 - 9
searx/engines/bing_news.py

@@ -1,14 +1,6 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Bing (News)
  Bing (News)
-
- @website     https://www.bing.com/news
- @provide-api yes (http://datamarket.azure.com/dataset/bing/search),
-              max. 5000 query/month
-
- @using-api   no (because of query limit)
- @results     RSS (using search portal)
- @stable      yes (except perhaps for the images)
- @parse       url, title, content, publishedDate, thumbnail
 """
 """
 
 
 from datetime import datetime
 from datetime import datetime
@@ -20,6 +12,16 @@ from searx.utils import match_language, eval_xpath_getindex
 from searx.engines.bing import language_aliases
 from searx.engines.bing import language_aliases
 from searx.engines.bing import _fetch_supported_languages, supported_languages_url  # NOQA # pylint: disable=unused-import
+about = {
+    "website": 'https://www.bing.com/news',
+    "wikidata_id": 'Q2878637',
+    "official_api_documentation": 'https://www.microsoft.com/en-us/bing/apis/bing-news-search-api',
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'RSS',
+}
+
 # engine dependent config
 categories = ['news']
 paging = True

+ 11 - 8
searx/engines/bing_videos.py

@@ -1,13 +1,6 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Bing (Videos)
  Bing (Videos)
-
- @website     https://www.bing.com/videos
- @provide-api yes (http://datamarket.azure.com/dataset/bing/search)
-
- @using-api   no
- @results     HTML
- @stable      no
- @parse       url, title, content, thumbnail
 """
 """
 
 
 from json import loads
 from json import loads
@@ -18,6 +11,16 @@ from searx.utils import match_language
 from searx.engines.bing import language_aliases
 from searx.engines.bing import language_aliases
 from searx.engines.bing import _fetch_supported_languages, supported_languages_url  # NOQA # pylint: disable=unused-import
+about = {
+    "website": 'https://www.bing.com/videos',
+    "wikidata_id": 'Q4914152',
+    "official_api_documentation": 'https://www.microsoft.com/en-us/bing/apis/bing-video-search-api',
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 categories = ['videos']
 paging = True
 safesearch = True

+ 14 - 8
searx/engines/btdigg.py

@@ -1,19 +1,25 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  BTDigg (Videos, Music, Files)
  BTDigg (Videos, Music, Files)
-
- @website     https://btdig.com
- @provide-api yes (on demand)
-
- @using-api   no
- @results     HTML (using search portal)
- @stable      no (HTML can change)
- @parse       url, title, content, seed, leech, magnetlink
 """
 """
 
 
 from lxml import html
 from lxml import html
 from urllib.parse import quote, urljoin
 from urllib.parse import quote, urljoin
 from searx.utils import extract_text, get_torrent_size
 from searx.utils import extract_text, get_torrent_size
 
 
+# about
+about = {
+    "website": 'https://btdig.com',
+    "wikidata_id": 'Q4836698',
+    "official_api_documentation": {
+        'url': 'https://btdig.com/contacts',
+        'comment': 'on demand'
+    },
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 # engine dependent config
 categories = ['videos', 'music', 'files']
 paging = True

+ 4 - 15
searx/engines/command.py

@@ -1,18 +1,7 @@
-'''
-searx is free software: you can redistribute it and/or modify
-it under the terms of the GNU Affero General Public License as published by
-the Free Software Foundation, either version 3 of the License, or
-(at your option) any later version.
-
-searx is distributed in the hope that it will be useful,
-but WITHOUT ANY WARRANTY; without even the implied warranty of
-MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
-GNU Affero General Public License for more details.
-
-You should have received a copy of the GNU Affero General Public License
-along with searx. If not, see < http://www.gnu.org/licenses/ >.
-'''
-
+# SPDX-License-Identifier: AGPL-3.0-or-later
+"""
+ Command (offline)
+"""
 
 
 import re
 import re
 from os.path import expanduser, isabs, realpath, commonprefix
 from os.path import expanduser, isabs, realpath, commonprefix

+ 14 - 0
searx/engines/currency_convert.py

@@ -1,5 +1,19 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
+"""
+ currency convert (DuckDuckGo)
+"""
+
 import json
+# about
+about = {
+    "website": 'https://duckduckgo.com/',
+    "wikidata_id": 'Q12805',
+    "official_api_documentation": 'https://duckduckgo.com/api',
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'JSONP',
+}

 engine_type = 'online_currency'
 categories = []

+ 11 - 10
searx/engines/dailymotion.py

@@ -1,15 +1,6 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Dailymotion (Videos)
  Dailymotion (Videos)
-
- @website     https://www.dailymotion.com
- @provide-api yes (http://www.dailymotion.com/developer)
-
- @using-api   yes
- @results     JSON
- @stable      yes
- @parse       url, title, thumbnail, publishedDate, embedded
-
- @todo        set content-parameter with correct data
 """
 """
 
 
 from json import loads
 from json import loads
@@ -17,6 +8,16 @@ from datetime import datetime
 from urllib.parse import urlencode
 from searx.utils import match_language, html_to_text
+# about
+about = {
+    "website": 'https://www.dailymotion.com',
+    "wikidata_id": 'Q769222',
+    "official_api_documentation": 'https://www.dailymotion.com/developer',
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'JSON',
+}
+
 # engine dependent config
 categories = ['videos']
 paging = True

+ 11 - 8
searx/engines/deezer.py

@@ -1,18 +1,21 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Deezer (Music)
  Deezer (Music)
-
- @website     https://deezer.com
- @provide-api yes (http://developers.deezer.com/api/)
-
- @using-api   yes
- @results     JSON
- @stable      yes
- @parse       url, title, content, embedded
 """
 """
 
 
 from json import loads
 from json import loads
 from urllib.parse import urlencode
 from urllib.parse import urlencode
 
 
+# about
+about = {
+    "website": 'https://deezer.com',
+    "wikidata_id": 'Q602243',
+    "official_api_documentation": 'https://developers.deezer.com/',
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'JSON',
+}
+
 # engine dependent config
 categories = ['music']
 paging = True

+ 11 - 10
searx/engines/deviantart.py

@@ -1,21 +1,22 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Deviantart (Images)
  Deviantart (Images)
-
- @website     https://www.deviantart.com/
- @provide-api yes (https://www.deviantart.com/developers/) (RSS)
-
- @using-api   no (TODO, rewrite to api)
- @results     HTML
- @stable      no (HTML can change)
- @parse       url, title, img_src
-
- @todo        rewrite to api
 """
 """
 # pylint: disable=missing-function-docstring
 # pylint: disable=missing-function-docstring
 
 
 from urllib.parse import urlencode
 from urllib.parse import urlencode
 from lxml import html
 from lxml import html
 
 
+# about
+about = {
+    "website": 'https://www.deviantart.com/',
+    "wikidata_id": 'Q46523',
+    "official_api_documentation": 'https://www.deviantart.com/developers/',
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 # engine dependent config
 categories = ['images']
 paging = True

+ 10 - 7
searx/engines/dictzone.py

@@ -1,18 +1,21 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Dictzone
  Dictzone
-
- @website     https://dictzone.com/
- @provide-api no
- @using-api   no
- @results     HTML (using search portal)
- @stable      no (HTML can change)
- @parse       url, title, content
 """
 """
 
 
 from urllib.parse import urljoin
 from urllib.parse import urljoin
 from lxml import html
 from lxml import html
 from searx.utils import eval_xpath
 from searx.utils import eval_xpath
 
 
+# about
+about = {
+    "website": 'https://dictzone.com/',
+    "wikidata_id": None,
+    "official_api_documentation": None,
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}

 engine_type = 'online_dictionnary'
 categories = ['general']

+ 10 - 8
searx/engines/digbt.py

@@ -1,19 +1,21 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  DigBT (Videos, Music, Files)
  DigBT (Videos, Music, Files)
-
- @website     https://digbt.org
- @provide-api no
-
- @using-api   no
- @results     HTML (using search portal)
- @stable      no (HTML can change)
- @parse       url, title, content, magnetlink
 """
 """
 
 
 from urllib.parse import urljoin
 from urllib.parse import urljoin
 from lxml import html
 from lxml import html
 from searx.utils import extract_text, get_torrent_size
 from searx.utils import extract_text, get_torrent_size
 
 
+# about
+about = {
+    "website": 'https://digbt.org',
+    "wikidata_id": None,
+    "official_api_documentation": None,
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}

 categories = ['videos', 'music', 'files']
 paging = True

+ 11 - 8
searx/engines/digg.py

@@ -1,13 +1,6 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Digg (News, Social media)
  Digg (News, Social media)
-
- @website     https://digg.com
- @provide-api no
-
- @using-api   no
- @results     HTML (using search portal)
- @stable      no (HTML can change)
- @parse       url, title, content, publishedDate, thumbnail
 """
 """
 # pylint: disable=missing-function-docstring
 # pylint: disable=missing-function-docstring
 
 
@@ -17,6 +10,16 @@ from datetime import datetime

 from lxml import html
+# about
+about = {
+    "website": 'https://digg.com',
+    "wikidata_id": 'Q270478',
+    "official_api_documentation": None,
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 # engine dependent config
 categories = ['news', 'social media']
 paging = True

+ 14 - 10
searx/engines/doku.py

@@ -1,18 +1,22 @@
-# Doku Wiki
-#
-# @website     https://www.dokuwiki.org/
-# @provide-api yes
-#              (https://www.dokuwiki.org/devel:xmlrpc)
-#
-# @using-api   no
-# @results     HTML
-# @stable      yes
-# @parse       (general)    url, title, content
+# SPDX-License-Identifier: AGPL-3.0-or-later
+"""
+ Doku Wiki
+"""
 
 
 from urllib.parse import urlencode
 from urllib.parse import urlencode
 from lxml.html import fromstring
 from lxml.html import fromstring
 from searx.utils import extract_text, eval_xpath
 from searx.utils import extract_text, eval_xpath
 
 
+# about
+about = {
+    "website": 'https://www.dokuwiki.org/',
+    "wikidata_id": 'Q851864',
+    "official_api_documentation": 'https://www.dokuwiki.org/devel:xmlrpc',
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 # engine dependent config
 categories = ['general']  # TODO , 'images', 'music', 'videos', 'files'
 paging = False

+ 11 - 11
searx/engines/duckduckgo.py

@@ -1,22 +1,22 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  DuckDuckGo (Web)
  DuckDuckGo (Web)
-
- @website     https://duckduckgo.com/
- @provide-api yes (https://duckduckgo.com/api),
-              but not all results from search-site
-
- @using-api   no
- @results     HTML (using search portal)
- @stable      no (HTML can change)
- @parse       url, title, content
-
- @todo        rewrite to api
 """
 """
 
 
 from lxml.html import fromstring
 from lxml.html import fromstring
 from json import loads
 from json import loads
 from searx.utils import extract_text, match_language, eval_xpath
 from searx.utils import extract_text, match_language, eval_xpath
 
 
+# about
+about = {
+    "website": 'https://duckduckgo.com/',
+    "wikidata_id": 'Q12805',
+    "official_api_documentation": 'https://duckduckgo.com/api',
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 # engine dependent config
 categories = ['general']
 paging = False

+ 12 - 8
searx/engines/duckduckgo_definitions.py

@@ -1,12 +1,6 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
-DuckDuckGo (definitions)
-
-- `Instant Answer API`_
-- `DuckDuckGo query`_
-
-.. _Instant Answer API: https://duckduckgo.com/api
-.. _DuckDuckGo query: https://api.duckduckgo.com/?q=DuckDuckGo&format=json&pretty=1
-
+ DuckDuckGo (Instant Answer API)
 """
 """
 
 
 import json
 import json
@@ -22,6 +16,16 @@ from searx.external_urls import get_external_url, get_earth_coordinates_url, are

 logger = logger.getChild('duckduckgo_definitions')
+# about
+about = {
+    "website": 'https://duckduckgo.com/',
+    "wikidata_id": 'Q12805',
+    "official_api_documentation": 'https://duckduckgo.com/api',
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'JSON',
+}
+
 URL = 'https://api.duckduckgo.com/'\
     + '?{query}&format=json&pretty=0&no_redirect=1&d=1'

+ 14 - 11
searx/engines/duckduckgo_images.py

@@ -1,16 +1,6 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  DuckDuckGo (Images)
  DuckDuckGo (Images)
-
- @website     https://duckduckgo.com/
- @provide-api yes (https://duckduckgo.com/api),
-              but images are not supported
-
- @using-api   no
- @results     JSON (site requires js to get images)
- @stable      no (JSON can change)
- @parse       url, title, img_src
-
- @todo        avoid extra request
 """
 """
 
 
 from json import loads
 from json import loads
@@ -20,6 +10,19 @@ from searx.engines.duckduckgo import get_region_code
 from searx.engines.duckduckgo import _fetch_supported_languages, supported_languages_url  # NOQA # pylint: disable=unused-import
 from searx.engines.duckduckgo import _fetch_supported_languages, supported_languages_url  # NOQA # pylint: disable=unused-import
 from searx.poolrequests import get
+about = {
+    "website": 'https://duckduckgo.com/',
+    "wikidata_id": 'Q12805',
+    "official_api_documentation": {
+        'url': 'https://duckduckgo.com/api',
+        'comment': 'but images are not supported',
+    },
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'JSON (site requires js to get images)',
+}
+
 # engine dependent config
 categories = ['images']
 paging = True

+ 11 - 6
searx/engines/duden.py

@@ -1,11 +1,6 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Duden
  Duden
- @website     https://www.duden.de
- @provide-api no
- @using-api   no
- @results     HTML (using search portal)
- @stable      no (HTML can change)
- @parse       url, title, content
 """
 """
 
 
 import re
 import re
@@ -13,6 +8,16 @@ from urllib.parse import quote, urljoin
 from lxml import html
 from searx.utils import extract_text, eval_xpath, eval_xpath_list, eval_xpath_getindex
+# about
+about = {
+    "website": 'https://www.duden.de',
+    "wikidata_id": 'Q73624591',
+    "official_api_documentation": None,
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 categories = ['general']
 paging = True
 language_support = False

+ 11 - 3
searx/engines/dummy-offline.py

@@ -1,11 +1,19 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Dummy Offline
  Dummy Offline
-
- @results     one result
- @stable      yes
 """
 """
 
 
 
 
+# about
+about = {
+    "wikidata_id": None,
+    "official_api_documentation": None,
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
+
 def search(query, request_params):
     return [{
         'result': 'this is what you get',

+ 11 - 3
searx/engines/dummy.py

@@ -1,10 +1,18 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Dummy
  Dummy
-
- @results     empty array
- @stable      yes
 """
 """
 
 
+# about
+about = {
+    "website": None,
+    "wikidata_id": None,
+    "official_api_documentation": None,
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'empty array',
+}
+

 # do search-request
 def request(query, params):

+ 14 - 9
searx/engines/ebay.py

@@ -1,17 +1,22 @@
-#  Ebay (Videos, Music, Files)
-#
-# @website     https://www.ebay.com
-# @provide-api no (nothing found)
-#
-# @using-api   no
-# @results     HTML (using search portal)
-# @stable      yes (HTML can change)
-# @parse       url, title, content, price, shipping, source
+# SPDX-License-Identifier: AGPL-3.0-or-later
+"""
+ Ebay (Videos, Music, Files)
+"""
 
 
 from lxml import html
 from lxml import html
 from searx.engines.xpath import extract_text
 from searx.engines.xpath import extract_text
 from urllib.parse import quote
 from urllib.parse import quote
 
 
+# about
+about = {
+    "website": 'https://www.ebay.com',
+    "wikidata_id": 'Q58024',
+    "official_api_documentation": 'https://developer.ebay.com/',
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 categories = ['shopping']
 paging = True

+ 5 - 0
searx/engines/elasticsearch.py

@@ -1,3 +1,8 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
+"""
+ Elasticsearch
+"""
+
 from json import loads, dumps
 from requests.auth import HTTPBasicAuth
 from searx.exceptions import SearxEngineAPIException

+ 11 - 7
searx/engines/etools.py

@@ -1,18 +1,22 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  eTools (Web)
  eTools (Web)
-
- @website      https://www.etools.ch
- @provide-api  no
- @using-api    no
- @results      HTML
- @stable       no (HTML can change)
- @parse        url, title, content
 """
 """
 
 
 from lxml import html
 from lxml import html
 from urllib.parse import quote
 from urllib.parse import quote
 from searx.utils import extract_text, eval_xpath
 from searx.utils import extract_text, eval_xpath
 
 
+# about
+about = {
+    "website": 'https://www.etools.ch',
+    "wikidata_id": None,
+    "official_api_documentation": None,
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 categories = ['general']
 paging = False
 language_support = False

+ 11 - 7
searx/engines/fdroid.py

@@ -1,18 +1,22 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  F-Droid (a repository of FOSS applications for Android)
  F-Droid (a repository of FOSS applications for Android)
-
- @website      https://f-droid.org/
- @provide-api  no
- @using-api    no
- @results      HTML
- @stable       no (HTML can change)
- @parse        url, title, content
 """
 """
 
 
 from urllib.parse import urlencode
 from urllib.parse import urlencode
 from lxml import html
 from lxml import html
 from searx.utils import extract_text
 from searx.utils import extract_text
 
 
+# about
+about = {
+    "website": 'https://f-droid.org/',
+    "wikidata_id": 'Q1386210',
+    "official_api_documentation": None,
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 # engine dependent config
 categories = ['files']
 paging = True

+ 11 - 9
searx/engines/flickr.py

@@ -1,21 +1,23 @@
-#!/usr/bin/env python
-
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Flickr (Images)
  Flickr (Images)
 
 
- @website     https://www.flickr.com
- @provide-api yes (https://secure.flickr.com/services/api/flickr.photos.search.html)
-
- @using-api   yes
- @results     JSON
- @stable      yes
- @parse       url, title, thumbnail, img_src
  More info on api-key : https://www.flickr.com/services/apps/create/
 """

 from json import loads
 from urllib.parse import urlencode
+# about
+about = {
+    "website": 'https://www.flickr.com',
+    "wikidata_id": 'Q103204',
+    "official_api_documentation": 'https://secure.flickr.com/services/api/flickr.photos.search.html',
+    "use_official_api": True,
+    "require_api_key": True,
+    "results": 'JSON',
+}
+
 categories = ['images']

 nb_per_page = 15

+ 12 - 11
searx/engines/flickr_noapi.py

@@ -1,15 +1,6 @@
-#!/usr/bin/env python
-
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
-  Flickr (Images)
-
- @website     https://www.flickr.com
- @provide-api yes (https://secure.flickr.com/services/api/flickr.photos.search.html)
-
- @using-api   no
- @results     HTML
- @stable      no
- @parse       url, title, thumbnail, img_src
+ Flickr (Images)
 """
 """
 
 
 from json import loads
 from json import loads
@@ -21,6 +12,16 @@ from searx.utils import ecma_unescape, html_to_text

 logger = logger.getChild('flickr-noapi')
+# about
+about = {
+    "website": 'https://www.flickr.com',
+    "wikidata_id": 'Q103204',
+    "official_api_documentation": 'https://secure.flickr.com/services/api/flickr.photos.search.html',
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 categories = ['images']

 url = 'https://www.flickr.com/'

+ 11 - 8
searx/engines/framalibre.py

@@ -1,13 +1,6 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  FramaLibre (It)
  FramaLibre (It)
-
- @website     https://framalibre.org/
- @provide-api no
-
- @using-api   no
- @results     HTML
- @stable      no (HTML can change)
- @parse       url, title, content, thumbnail, img_src
 """
 """
 
 
 from html import escape
 from html import escape
@@ -15,6 +8,16 @@ from urllib.parse import urljoin, urlencode
 from lxml import html
 from searx.utils import extract_text
+# about
+about = {
+    "website": 'https://framalibre.org/',
+    "wikidata_id": 'Q30213882',
+    "official_api_documentation": None,
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 # engine dependent config
 categories = ['it']
 paging = True

+ 15 - 8
searx/engines/frinkiac.py

@@ -1,17 +1,24 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
-Frinkiac (Images)
-
-@website     https://www.frinkiac.com
-@provide-api no
-@using-api   no
-@results     JSON
-@stable      no
-@parse       url, title, img_src
+ Frinkiac (Images)
 """
 """
 
 
 from json import loads
 from json import loads
 from urllib.parse import urlencode
 from urllib.parse import urlencode
 
 
+# about
+about = {
+    "website": 'https://frinkiac.com',
+    "wikidata_id": 'Q24882614',
+    "official_api_documentation": {
+        'url': None,
+        'comment': 'see https://github.com/MitchellAW/CompuGlobal'
+    },
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'JSON',
+}
+
 categories = ['images']

 BASE = 'https://frinkiac.com/'

+ 12 - 9
searx/engines/genius.py

@@ -1,19 +1,22 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
-Genius
-
- @website     https://www.genius.com/
- @provide-api yes (https://docs.genius.com/)
-
- @using-api   yes
- @results     JSON
- @stable      yes
- @parse       url, title, content, thumbnail, publishedDate
+ Genius
 """
 """
 
 
 from json import loads
 from json import loads
 from urllib.parse import urlencode
 from urllib.parse import urlencode
 from datetime import datetime
 from datetime import datetime
 
 
+# about
+about = {
+    "website": 'https://genius.com/',
+    "wikidata_id": 'Q3419343',
+    "official_api_documentation": 'https://docs.genius.com/',
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'JSON',
+}
+
 # engine dependent config
 categories = ['music']
 paging = True

+ 11 - 9
searx/engines/gentoo.py

@@ -1,20 +1,22 @@
-# -*- coding: utf-8 -*-
-
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Gentoo Wiki
  Gentoo Wiki
-
- @website      https://wiki.gentoo.org
- @provide-api  yes
- @using-api    no
- @results      HTML
- @stable       no (HTML can change)
- @parse        url, title
 """
 """
 
 
 from urllib.parse import urlencode, urljoin
 from urllib.parse import urlencode, urljoin
 from lxml import html
 from lxml import html
 from searx.utils import extract_text
 from searx.utils import extract_text
 
 
+# about
+about = {
+    "website": 'https://wiki.gentoo.org/',
+    "wikidata_id": 'Q1050637',
+    "official_api_documentation": 'https://wiki.gentoo.org/api.php',
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 # engine dependent config
 categories = ['it']
 language_support = True

+ 10 - 8
searx/engines/gigablast.py

@@ -1,14 +1,6 @@
 # SPDX-License-Identifier: AGPL-3.0-or-later
 """
  Gigablast (Web)
-
- @website     https://gigablast.com
- @provide-api yes (https://gigablast.com/api.html)
-
- @using-api   yes
- @results     XML
- @stable      yes
- @parse       url, title, content
 """
 """
 # pylint: disable=missing-function-docstring, invalid-name
 # pylint: disable=missing-function-docstring, invalid-name
 
 
@@ -18,6 +10,16 @@ from urllib.parse import urlencode
 # from searx import logger
 from searx.poolrequests import get
+# about
+about = {
+    "website": 'https://www.gigablast.com',
+    "wikidata_id": 'Q3105449',
+    "official_api_documentation": 'https://gigablast.com/api.html',
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'JSON',
+}
+
 # engine dependent config
 categories = ['general']
 # gigablast's pagination is totally damaged, don't use it

+ 12 - 9
searx/engines/github.py

@@ -1,18 +1,21 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
- Github (It)
-
- @website     https://github.com/
- @provide-api yes (https://developer.github.com/v3/)
-
- @using-api   yes
- @results     JSON
- @stable      yes (using api)
- @parse       url, title, content
+ Github (IT)
 """
 """
 
 
 from json import loads
 from json import loads
 from urllib.parse import urlencode
 from urllib.parse import urlencode
 
 
+# about
+about = {
+    "website": 'https://github.com/',
+    "wikidata_id": 'Q364',
+    "official_api_documentation": 'https://developer.github.com/v3/',
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'JSON',
+}
+
 # engine dependent config
 categories = ['it']

+ 14 - 12
searx/engines/google.py

@@ -1,19 +1,11 @@
 # SPDX-License-Identifier: AGPL-3.0-or-later
 """Google (Web)
-:website:     https://www.google.com
-:provide-api: yes (https://developers.google.com/custom-search/)
-:using-api:   not the offical, since it needs registration to another service
-:results:     HTML
-:stable:      no
-:parse:       url, title, content, number_of_results, answer, suggestion, correction
-
-For detailed description of the *REST-full* API see: `Query Parameter
-Definitions`_.
-
-.. _Query Parameter Definitions:
-   https://developers.google.com/custom-search/docs/xml_results#WebSearch_Query_Parameter_Definitions
+ For detailed description of the *REST-full* API see: `Query Parameter
+ Definitions`_.
+ .. _Query Parameter Definitions:
+ https://developers.google.com/custom-search/docs/xml_results#WebSearch_Query_Parameter_Definitions
 """
 """
 
 
 # pylint: disable=invalid-name, missing-function-docstring
 # pylint: disable=invalid-name, missing-function-docstring
@@ -27,6 +19,16 @@ from searx.exceptions import SearxEngineCaptchaException

 logger = logger.getChild('google engine')
+# about
+about = {
+    "website": 'https://www.google.com',
+    "wikidata_id": 'Q9366',
+    "official_api_documentation": 'https://developers.google.com/custom-search/',
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 # engine dependent config
 categories = ['general']
 paging = True

+ 10 - 12
searx/engines/google_images.py

@@ -1,14 +1,6 @@
 # SPDX-License-Identifier: AGPL-3.0-or-later
 """Google (Images)
-:website:     https://images.google.com (redirected to subdomain www.)
-:provide-api: yes (https://developers.google.com/custom-search/)
-:using-api:   not the offical, since it needs registration to another service
-:results:     HTML
-:stable:      no
-:template:    images.html
-:parse:       url, title, content, source, thumbnail_src, img_src
-
 For detailed description of the *REST-full* API see: `Query Parameter
 Definitions`_.
@@ -18,10 +10,6 @@ Definitions`_.
    ``data:` scheme).::

      Header set Content-Security-Policy "img-src 'self' data: ;"
-
-.. _Query Parameter Definitions:
-   https://developers.google.com/custom-search/docs/xml_results#WebSearch_Query_Parameter_Definitions
-
 """
 """
 
 
 from urllib.parse import urlencode, urlparse, unquote
 from urllib.parse import urlencode, urlparse, unquote
@@ -39,6 +27,16 @@ from searx.engines.google import (

 logger = logger.getChild('google images')
+# about
+about = {
+    "website": 'https://images.google.com/',
+    "wikidata_id": 'Q521550',
+    "official_api_documentation": 'https://developers.google.com/custom-search/docs/xml_results#WebSearch_Query_Parameter_Definitions',  # NOQA
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 # engine dependent config

 categories = ['images']

+ 11 - 8
searx/engines/google_news.py

@@ -1,13 +1,6 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Google (News)
  Google (News)
-
- @website     https://news.google.com
- @provide-api no
-
- @using-api   no
- @results     HTML
- @stable      no
- @parse       url, title, content, publishedDate
 """
 """
 
 
 from urllib.parse import urlencode
 from urllib.parse import urlencode
@@ -15,6 +8,16 @@ from lxml import html
 from searx.utils import match_language
 from searx.engines.google import _fetch_supported_languages, supported_languages_url  # NOQA # pylint: disable=unused-import
+# about
+about = {
+    "website": 'https://news.google.com',
+    "wikidata_id": 'Q12020',
+    "official_api_documentation": None,
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 # search-url
 categories = ['news']
 paging = True

+ 11 - 8
searx/engines/google_videos.py

@@ -1,13 +1,6 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Google (Videos)
  Google (Videos)
-
- @website     https://www.google.com
- @provide-api yes (https://developers.google.com/custom-search/)
-
- @using-api   no
- @results     HTML
- @stable      no
- @parse       url, title, content, thumbnail
 """
 """
 
 
 from datetime import date, timedelta
 from datetime import date, timedelta
@@ -16,6 +9,16 @@ from lxml import html
 from searx.utils import extract_text, eval_xpath, eval_xpath_list, eval_xpath_getindex
 import re
+# about
+about = {
+    "website": 'https://www.google.com',
+    "wikidata_id": 'Q219885',
+    "official_api_documentation": 'https://developers.google.com/custom-search/',
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 # engine dependent config
 categories = ['videos']
 paging = True

+ 13 - 12
searx/engines/ina.py

@@ -1,15 +1,7 @@
-#  INA (Videos)
-#
-# @website     https://www.ina.fr/
-# @provide-api no
-#
-# @using-api   no
-# @results     HTML (using search portal)
-# @stable      no (HTML can change)
-# @parse       url, title, content, publishedDate, thumbnail
-#
-# @todo        set content-parameter with correct data
-# @todo        embedded (needs some md5 from video page)
+# SPDX-License-Identifier: AGPL-3.0-or-later
+"""
+ INA (Videos)
+"""
 
 
 from json import loads
 from json import loads
 from html import unescape
 from html import unescape
@@ -18,6 +10,15 @@ from lxml import html
 from dateutil import parser
 from searx.utils import extract_text
+# about
+about = {
+    "website": 'https://www.ina.fr/',
+    "wikidata_id": 'Q1665109',
+    "official_api_documentation": None,
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}

 # engine dependent config
 categories = ['videos']

+ 14 - 9
searx/engines/invidious.py

@@ -1,17 +1,22 @@
-# Invidious (Videos)
-#
-# @website     https://invidio.us/
-# @provide-api yes (https://github.com/omarroth/invidious/wiki/API)
-#
-# @using-api   yes
-# @results     JSON
-# @stable      yes
-# @parse       url, title, content, publishedDate, thumbnail, embedded, author, length
+# SPDX-License-Identifier: AGPL-3.0-or-later
+"""
+ Invidious (Videos)
+"""
 
 
 from urllib.parse import quote_plus
 from urllib.parse import quote_plus
 from dateutil import parser
 from dateutil import parser
 import time
 import time
 
 
+# about
+about = {
+    "website": 'https://instances.invidio.us/',
+    "wikidata_id": 'Q79343316',
+    "official_api_documentation": 'https://github.com/omarroth/invidious/wiki/API',
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'JSON',
+}
+
 # engine dependent config
 categories = ["videos", "music"]
 paging = True

+ 2 - 0
searx/engines/json_engine.py

@@ -1,3 +1,5 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
+
 from collections.abc import Iterable
 from json import loads
 from urllib.parse import urlencode

+ 11 - 8
searx/engines/kickass.py

@@ -1,13 +1,6 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Kickass Torrent (Videos, Music, Files)
  Kickass Torrent (Videos, Music, Files)
-
- @website     https://kickass.so
- @provide-api no (nothing found)
-
- @using-api   no
- @results     HTML (using search portal)
- @stable      yes (HTML can change)
- @parse       url, title, content, seed, leech, magnetlink
 """
 """
 
 
 from lxml import html
 from lxml import html
@@ -15,6 +8,16 @@ from operator import itemgetter
 from urllib.parse import quote, urljoin
 from searx.utils import extract_text, get_torrent_size, convert_str_to_int
+# about
+about = {
+    "website": 'https://kickass.so',
+    "wikidata_id": 'Q17062285',
+    "official_api_documentation": None,
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 # engine dependent config
 categories = ['videos', 'music', 'files']
 paging = True

+ 12 - 11
searx/engines/mediawiki.py

@@ -1,21 +1,22 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
- general mediawiki-engine (Web)
-
- @website     websites built on mediawiki (https://www.mediawiki.org)
- @provide-api yes (http://www.mediawiki.org/wiki/API:Search)
-
- @using-api   yes
- @results     JSON
- @stable      yes
- @parse       url, title
-
- @todo        content
+ General mediawiki-engine (Web)
 """
 """
 
 
 from json import loads
 from json import loads
 from string import Formatter
 from string import Formatter
 from urllib.parse import urlencode, quote
 from urllib.parse import urlencode, quote
 
 
+# about
+about = {
+    "website": None,
+    "wikidata_id": None,
+    "official_api_documentation": 'http://www.mediawiki.org/wiki/API:Search',
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'JSON',
+}
+
 # engine dependent config
 categories = ['general']
 language_support = True

+ 12 - 8
searx/engines/microsoft_academic.py

@@ -1,12 +1,6 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
-Microsoft Academic (Science)
-
-@website     https://academic.microsoft.com
-@provide-api yes
-@using-api   no
-@results     JSON
-@stable      no
-@parse       url, title, content
+ Microsoft Academic (Science)
 """
 """
 
 
 from datetime import datetime
 from datetime import datetime
@@ -15,6 +9,16 @@ from uuid import uuid4
 from urllib.parse import urlencode
 from searx.utils import html_to_text
+# about
+about = {
+    "website": 'https://academic.microsoft.com',
+    "wikidata_id": 'Q28136779',
+    "official_api_documentation": 'http://ma-graph.org/',
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'JSON',
+}
+
 categories = ['images']
 paging = True
 result_url = 'https://academic.microsoft.com/api/search/GetEntityResults?{query}'

+ 11 - 8
searx/engines/mixcloud.py

@@ -1,19 +1,22 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Mixcloud (Music)
  Mixcloud (Music)
-
- @website     https://http://www.mixcloud.com/
- @provide-api yes (http://www.mixcloud.com/developers/
-
- @using-api   yes
- @results     JSON
- @stable      yes
- @parse       url, title, content, embedded, publishedDate
 """
 """
 
 
 from json import loads
 from json import loads
 from dateutil import parser
 from dateutil import parser
 from urllib.parse import urlencode
 from urllib.parse import urlencode
 
 
+# about
+about = {
+    "website": 'https://www.mixcloud.com/',
+    "wikidata_id": 'Q6883832',
+    "official_api_documentation": 'http://www.mixcloud.com/developers/',
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'JSON',
+}
+
 # engine dependent config
 categories = ['music']
 paging = True

+ 11 - 8
searx/engines/not_evil.py

@@ -1,19 +1,22 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  not Evil (Onions)
  not Evil (Onions)
-
- @website     http://hss3uro2hsxfogfq.onion
- @provide-api yes (http://hss3uro2hsxfogfq.onion/api.htm)
-
- @using-api   no
- @results     HTML
- @stable      no
- @parse       url, title, content
 """
 """
 
 
 from urllib.parse import urlencode
 from urllib.parse import urlencode
 from lxml import html
 from lxml import html
 from searx.engines.xpath import extract_text
 from searx.engines.xpath import extract_text
 
 
+# about
+about = {
+    "website": 'http://hss3uro2hsxfogfq.onion',
+    "wikidata_id": None,
+    "official_api_documentation": 'http://hss3uro2hsxfogfq.onion/api.htm',
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 # engine dependent config
 categories = ['onions']
 paging = True

+ 11 - 7
searx/engines/nyaa.py

@@ -1,18 +1,22 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Nyaa.si (Anime Bittorrent tracker)
  Nyaa.si (Anime Bittorrent tracker)
-
- @website      https://nyaa.si/
- @provide-api  no
- @using-api    no
- @results      HTML
- @stable       no (HTML can change)
- @parse        url, title, content, seed, leech, torrentfile
 """
 """
 
 
 from lxml import html
 from lxml import html
 from urllib.parse import urlencode
 from urllib.parse import urlencode
 from searx.utils import extract_text, get_torrent_size, int_or_zero
 from searx.utils import extract_text, get_torrent_size, int_or_zero
 
 
+# about
+about = {
+    "website": 'https://nyaa.si/',
+    "wikidata_id": None,
+    "official_api_documentation": None,
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 # engine dependent config
 categories = ['files', 'images', 'videos', 'music']
 paging = True

+ 13 - 9
searx/engines/opensemantic.py

@@ -1,18 +1,22 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
-Open Semantic Search
-
- @website    https://www.opensemanticsearch.org/
- @provide-api yes (https://www.opensemanticsearch.org/dev)
-
- @using-api  yes
- @results    JSON
- @stable     yes
- @parse      url, title, content, publishedDate
+ Open Semantic Search
 """
 """
+
 from dateutil import parser
 from json import loads
 from urllib.parse import quote

+# about
+about = {
+    "website": 'https://www.opensemanticsearch.org/',
+    "wikidata_id": None,
+    "official_api_documentation": 'https://www.opensemanticsearch.org/dev',
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'JSON',
+}
+
 base_url = 'http://localhost:8983/solr/opensemanticsearch/'
 search_string = 'query?q={query}'


+ 11 - 8
searx/engines/openstreetmap.py

@@ -1,19 +1,22 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  OpenStreetMap (Map)
  OpenStreetMap (Map)
-
- @website     https://openstreetmap.org/
- @provide-api yes (http://wiki.openstreetmap.org/wiki/Nominatim)
-
- @using-api   yes
- @results     JSON
- @stable      yes
- @parse       url, title
 """
 """
 
 
 import re
 import re
 from json import loads
 from json import loads
 from flask_babel import gettext
 from flask_babel import gettext
 
 
+# about
+about = {
+    "website": 'https://www.openstreetmap.org/',
+    "wikidata_id": 'Q936',
+    "official_api_documentation": 'http://wiki.openstreetmap.org/wiki/Nominatim',
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'JSON',
+}
+
 # engine dependent config
 categories = ['map']
 paging = False

+ 11 - 8
searx/engines/pdbe.py

@@ -1,18 +1,21 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  PDBe (Protein Data Bank in Europe)
  PDBe (Protein Data Bank in Europe)
-
- @website       https://www.ebi.ac.uk/pdbe
- @provide-api   yes (https://www.ebi.ac.uk/pdbe/api/doc/search.html),
-                unlimited
- @using-api     yes
- @results       python dictionary (from json)
- @stable        yes
- @parse         url, title, content, img_src
 """
 """
 
 
 from json import loads
 from json import loads
 from flask_babel import gettext
 from flask_babel import gettext
 
 
+# about
+about = {
+    "website": 'https://www.ebi.ac.uk/pdbe',
+    "wikidata_id": 'Q55823905',
+    "official_api_documentation": 'https://www.ebi.ac.uk/pdbe/api/doc/search.html',
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'JSON',
+}
+
 categories = ['science']

 hide_obsolete = False

+ 11 - 10
searx/engines/peertube.py

@@ -1,15 +1,6 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  peertube (Videos)
  peertube (Videos)
-
- @website     https://www.peertube.live
- @provide-api yes (https://docs.joinpeertube.org/api-rest-reference.html)
-
- @using-api   yes
- @results     JSON
- @stable      yes
- @parse       url, title, thumbnail, publishedDate, embedded
-
- @todo        implement time range support
 """
 """
 
 
 from json import loads
 from json import loads
@@ -17,6 +8,16 @@ from datetime import datetime
 from urllib.parse import urlencode
 from searx.utils import html_to_text

+# about
+about = {
+    "website": 'https://joinpeertube.org',
+    "wikidata_id": 'Q50938515',
+    "official_api_documentation": 'https://docs.joinpeertube.org/api-rest-reference.html',
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'JSON',
+}
+
 # engine dependent config
 categories = ["videos"]
 paging = True

+ 11 - 8
searx/engines/photon.py

@@ -1,19 +1,22 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Photon (Map)
  Photon (Map)
-
- @website     https://photon.komoot.de
- @provide-api yes (https://photon.komoot.de/)
-
- @using-api   yes
- @results     JSON
- @stable      yes
- @parse       url, title
 """
 """
 
 
 from json import loads
 from json import loads
 from urllib.parse import urlencode
 from urllib.parse import urlencode
 from searx.utils import searx_useragent
 from searx.utils import searx_useragent
 
 
+# about
+about = {
+    "website": 'https://photon.komoot.de',
+    "wikidata_id": None,
+    "official_api_documentation": 'https://photon.komoot.de/',
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'JSON',
+}
+
 # engine dependent config
 categories = ['map']
 paging = False

+ 14 - 9
searx/engines/piratebay.py

@@ -1,12 +1,7 @@
-#  Piratebay (Videos, Music, Files)
-#
-# @website     https://thepiratebay.org
-# @provide-api yes (https://apibay.org/)
-#
-# @using-api   yes
-# @results     JSON
-# @stable      no (the API is not documented nor versioned)
-# @parse       url, title, seed, leech, magnetlink, filesize, publishedDate
+# SPDX-License-Identifier: AGPL-3.0-or-later
+"""
+ Piratebay (Videos, Music, Files)
+"""

 from json import loads
 from datetime import datetime
@@ -15,6 +10,16 @@ from operator import itemgetter
 from urllib.parse import quote
 from searx.utils import get_torrent_size

+# about
+about = {
+    "website": 'https://thepiratebay.org',
+    "wikidata_id": 'Q22663',
+    "official_api_documentation": 'https://apibay.org/',
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'JSON',
+}
+
 # engine dependent config
 categories = ["videos", "music", "files"]


+ 13 - 9
searx/engines/pubmed.py

@@ -1,14 +1,6 @@
-#!/usr/bin/env python
-
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  PubMed (Scholar publications)
  PubMed (Scholar publications)
- @website     https://www.ncbi.nlm.nih.gov/pubmed/
- @provide-api yes (https://www.ncbi.nlm.nih.gov/home/develop/api/)
- @using-api   yes
- @results     XML
- @stable      yes
- @parse       url, title, publishedDate, content
- More info on api: https://www.ncbi.nlm.nih.gov/books/NBK25501/
 """
 """
 
 
 from flask_babel import gettext
 from flask_babel import gettext
@@ -17,6 +9,18 @@ from datetime import datetime
 from urllib.parse import urlencode
 from searx.poolrequests import get

+# about
+about = {
+    "website": 'https://www.ncbi.nlm.nih.gov/pubmed/',
+    "wikidata_id": 'Q1540899',
+    "official_api_documentation": {
+        'url': 'https://www.ncbi.nlm.nih.gov/home/develop/api/',
+        'comment': 'More info on api: https://www.ncbi.nlm.nih.gov/books/NBK25501/'
+    },
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'XML',
+}

 categories = ['science']


+ 10 - 8
searx/engines/qwant.py

@@ -1,13 +1,6 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Qwant (Web, Images, News, Social)
  Qwant (Web, Images, News, Social)
-
- @website     https://qwant.com/
- @provide-api not officially (https://api.qwant.com/api/search/)
-
- @using-api   yes
- @results     JSON
- @stable      yes
- @parse       url, title, content
 """
 """
 
 
 from datetime import datetime
 from datetime import datetime
@@ -17,6 +10,15 @@ from searx.utils import html_to_text, match_language
 from searx.exceptions import SearxEngineAPIException, SearxEngineCaptchaException
 from searx.raise_for_httperror import raise_for_httperror

+# about
+about = {
+    "website": 'https://www.qwant.com/',
+    "wikidata_id": 'Q14657870',
+    "official_api_documentation": None,
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'JSON',
+}

 # engine dependent config
 categories = []

+ 11 - 6
searx/engines/recoll.py

@@ -1,17 +1,22 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Recoll (local search engine)
  Recoll (local search engine)
-
- @using-api   yes
- @results     JSON
- @stable      yes
- @parse       url, content, size, abstract, author, mtype, subtype, time, \
-              filename, label, type, embedded
 """
 """
 
 
 from datetime import date, timedelta
 from datetime import date, timedelta
 from json import loads
 from json import loads
 from urllib.parse import urlencode, quote
 from urllib.parse import urlencode, quote
 
 
+# about
+about = {
+    "website": None,
+    "wikidata_id": 'Q15735774',
+    "official_api_documentation": 'https://www.lesbonscomptes.com/recoll/',
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'JSON',
+}
+
 # engine dependent config
 time_range_support = True


+ 11 - 8
searx/engines/reddit.py

@@ -1,19 +1,22 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Reddit
  Reddit
-
- @website      https://www.reddit.com/
- @provide-api  yes (https://www.reddit.com/dev/api)
-
- @using-api    yes
- @results      JSON
- @stable       yes
- @parse        url, title, content, thumbnail, publishedDate
 """
 """
 
 
 import json
 import json
 from datetime import datetime
 from datetime import datetime
 from urllib.parse import urlencode, urljoin, urlparse
 from urllib.parse import urlencode, urljoin, urlparse
 
 
+# about
+about = {
+    "website": 'https://www.reddit.com/',
+    "wikidata_id": 'Q1136',
+    "official_api_documentation": 'https://www.reddit.com/dev/api',
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'JSON',
+}
+
 # engine dependent config
 categories = ['general', 'images', 'news', 'social media']
 page_size = 25

+ 11 - 8
searx/engines/scanr_structures.py

@@ -1,18 +1,21 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  ScanR Structures (Science)
  ScanR Structures (Science)
-
- @website     https://scanr.enseignementsup-recherche.gouv.fr
- @provide-api yes (https://scanr.enseignementsup-recherche.gouv.fr/api/swagger-ui.html)
-
- @using-api   yes
- @results     JSON
- @stable      yes
- @parse       url, title, content, img_src
 """
 """
 
 
 from json import loads, dumps
 from json import loads, dumps
 from searx.utils import html_to_text
 from searx.utils import html_to_text
 
 
+# about
+about = {
+    "website": 'https://scanr.enseignementsup-recherche.gouv.fr',
+    "wikidata_id": 'Q44105684',
+    "official_api_documentation": 'https://scanr.enseignementsup-recherche.gouv.fr/opendata',
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'JSON',
+}
+
 # engine dependent config
 categories = ['science']
 paging = True

+ 11 - 9
searx/engines/searchcode_code.py

@@ -1,18 +1,20 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
- Searchcode (It)
-
- @website     https://searchcode.com/
- @provide-api yes (https://searchcode.com/api/)
-
- @using-api   yes
- @results     JSON
- @stable      yes
- @parse       url, title, content
+ Searchcode (IT)
 """
 """
 
 
 from json import loads
 from json import loads
 from urllib.parse import urlencode
 from urllib.parse import urlencode
 
 
+# about
+about = {
+    "website": 'https://searchcode.com/',
+    "wikidata_id": None,
+    "official_api_documentation": 'https://searchcode.com/api/',
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'JSON',
+}

 # engine dependent config
 categories = ['it']

+ 10 - 8
searx/engines/searx_engine.py

@@ -1,18 +1,20 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Searx (all)
  Searx (all)
-
- @website     https://github.com/searx/searx
- @provide-api yes (https://searx.github.io/searx/dev/search_api.html)
-
- @using-api   yes
- @results     JSON
- @stable      yes (using api)
- @parse       url, title, content
 """
 """
 
 
 from json import loads
 from json import loads
 from searx.engines import categories as searx_categories
 from searx.engines import categories as searx_categories
 
 
+# about
+about = {
+    "website": 'https://github.com/searx/searx',
+    "wikidata_id": 'Q17639196',
+    "official_api_documentation": 'https://searx.github.io/searx/dev/search_api.html',
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'JSON',
+}

 categories = searx_categories.keys()


+ 14 - 8
searx/engines/sepiasearch.py

@@ -1,17 +1,23 @@
-# SepiaSearch (Videos)
-#
-# @website     https://sepiasearch.org
-# @provide-api https://framagit.org/framasoft/peertube/search-index/-/tree/master/server/controllers/api
-# @using-api   yes
-# @results     JSON
-# @stable      yes
-# @parse       url, title, content, publishedDate, thumbnail
+# SPDX-License-Identifier: AGPL-3.0-or-later
+"""
+ SepiaSearch (Videos)
+"""

 from json import loads
 from dateutil import parser, relativedelta
 from urllib.parse import urlencode
 from datetime import datetime

+# about
+about = {
+    "website": 'https://sepiasearch.org',
+    "wikidata_id": None,
+    "official_api_documentation": "https://framagit.org/framasoft/peertube/search-index/-/tree/master/server/controllers/api",  # NOQA
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'JSON',
+}
+
 categories = ['videos']
 paging = True
 language_support = True

+ 10 - 8
searx/engines/soundcloud.py

@@ -1,13 +1,6 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Soundcloud (Music)
  Soundcloud (Music)
-
- @website     https://soundcloud.com
- @provide-api yes (https://developers.soundcloud.com/)
-
- @using-api   yes
- @results     JSON
- @stable      yes
- @parse       url, title, content, publishedDate, embedded
 """
 """
 
 
 import re
 import re
@@ -18,6 +11,15 @@ from urllib.parse import quote_plus, urlencode
 from searx import logger
 from searx.poolrequests import get as http_get

+# about
+about = {
+    "website": 'https://soundcloud.com',
+    "wikidata_id": 'Q568769',
+    "official_api_documentation": 'https://developers.soundcloud.com/',
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'JSON',
+}

 # engine dependent config
 categories = ['music']

+ 11 - 8
searx/engines/spotify.py

@@ -1,13 +1,6 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Spotify (Music)
  Spotify (Music)
-
- @website     https://spotify.com
- @provide-api yes (https://developer.spotify.com/web-api/search-item/)
-
- @using-api   yes
- @results     JSON
- @stable      yes
- @parse       url, title, content, embedded
 """
 """
 
 
 from json import loads
 from json import loads
@@ -15,6 +8,16 @@ from urllib.parse import urlencode
 import requests
 import base64

+# about
+about = {
+    "website": 'https://www.spotify.com',
+    "wikidata_id": 'Q689141',
+    "official_api_documentation": 'https://developer.spotify.com/web-api/search-item/',
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'JSON',
+}
+
 # engine dependent config
 categories = ['music']
 paging = True

+ 12 - 9
searx/engines/stackoverflow.py

@@ -1,13 +1,6 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
- Stackoverflow (It)
-
- @website     https://stackoverflow.com/
- @provide-api not clear (https://api.stackexchange.com/docs/advanced-search)
-
- @using-api   no
- @results     HTML
- @stable      no (HTML can change)
- @parse       url, title, content
+ Stackoverflow (IT)
 """
 """
 
 
 from urllib.parse import urlencode, urljoin, urlparse
 from urllib.parse import urlencode, urljoin, urlparse
@@ -15,6 +8,16 @@ from lxml import html
 from searx.utils import extract_text
 from searx.exceptions import SearxEngineCaptchaException

+# about
+about = {
+    "website": 'https://stackoverflow.com/',
+    "wikidata_id": 'Q549037',
+    "official_api_documentation": 'https://api.stackexchange.com/docs',
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 # engine dependent config
 categories = ['it']
 paging = True

+ 14 - 11
searx/engines/startpage.py

@@ -1,14 +1,7 @@
-#  Startpage (Web)
-#
-# @website     https://startpage.com
-# @provide-api no (nothing found)
-#
-# @using-api   no
-# @results     HTML
-# @stable      no (HTML can change)
-# @parse       url, title, content
-#
-# @todo        paging
+# SPDX-License-Identifier: AGPL-3.0-or-later
+"""
+ Startpage (Web)
+"""

 from lxml import html
 from dateutil import parser
@@ -19,6 +12,16 @@ from babel import Locale
 from babel.localedata import locale_identifiers
 from searx.utils import extract_text, eval_xpath, match_language

+# about
+about = {
+    "website": 'https://startpage.com',
+    "wikidata_id": 'Q2333295',
+    "official_api_documentation": None,
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 # engine dependent config
 categories = ['general']
 # there is a mechanism to block "bot" search

+ 11 - 8
searx/engines/tokyotoshokan.py

@@ -1,13 +1,6 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Tokyo Toshokan (A BitTorrent Library for Japanese Media)
  Tokyo Toshokan (A BitTorrent Library for Japanese Media)
-
- @website      https://www.tokyotosho.info/
- @provide-api  no
- @using-api    no
- @results      HTML
- @stable       no (HTML can change)
- @parse        url, title, publishedDate, seed, leech,
-               filesize, magnetlink, content
 """
 """
 
 
 import re
 import re
@@ -16,6 +9,16 @@ from lxml import html
 from datetime import datetime
 from searx.utils import extract_text, get_torrent_size, int_or_zero

+# about
+about = {
+    "website": 'https://www.tokyotosho.info/',
+    "wikidata_id": None,
+    "official_api_documentation": None,
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 # engine dependent config
 categories = ['files', 'videos', 'music']
 paging = True

+ 11 - 9
searx/engines/torrentz.py

@@ -1,14 +1,6 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Torrentz2.is (BitTorrent meta-search engine)
  Torrentz2.is (BitTorrent meta-search engine)
-
- @website      https://torrentz2.is/
- @provide-api  no
-
- @using-api    no
- @results      HTML
- @stable       no (HTML can change, although unlikely,
-                   see https://torrentz.is/torrentz.btsearch)
- @parse        url, title, publishedDate, seed, leech, filesize, magnetlink
 """
 """
 
 
 import re
 import re
@@ -17,6 +9,16 @@ from lxml import html
 from datetime import datetime
 from searx.utils import extract_text, get_torrent_size

+# about
+about = {
+    "website": 'https://torrentz2.is/',
+    "wikidata_id": 'Q1156687',
+    "official_api_documentation": 'https://torrentz.is/torrentz.btsearch',
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 # engine dependent config
 categories = ['files', 'videos', 'music']
 paging = True

+ 11 - 7
searx/engines/translated.py

@@ -1,14 +1,18 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  MyMemory Translated
  MyMemory Translated
-
- @website     https://mymemory.translated.net/
- @provide-api yes (https://mymemory.translated.net/doc/spec.php)
- @using-api   yes
- @results     JSON
- @stable      yes
- @parse       url, title, content
 """
 """
 
 
+# about
+about = {
+    "website": 'https://mymemory.translated.net/',
+    "wikidata_id": None,
+    "official_api_documentation": 'https://mymemory.translated.net/doc/spec.php',
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'JSON',
+}
+
 engine_type = 'online_dictionnary'
 categories = ['general']
 url = 'https://api.mymemory.translated.net/get?q={query}&langpair={from_lang}|{to_lang}{key}'

+ 11 - 8
searx/engines/unsplash.py

@@ -1,18 +1,21 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Unsplash
  Unsplash
-
- @website     https://unsplash.com
- @provide-api yes (https://unsplash.com/developers)
-
- @using-api   no
- @results     JSON (using search portal's infiniscroll API)
- @stable      no (JSON format could change any time)
- @parse       url, title, img_src, thumbnail_src
 """
 """
 
 
 from urllib.parse import urlencode, urlparse, urlunparse, parse_qsl
 from urllib.parse import urlencode, urlparse, urlunparse, parse_qsl
 from json import loads
 from json import loads
 
 
+# about
+about = {
+    "website": 'https://unsplash.com',
+    "wikidata_id": 'Q28233552',
+    "official_api_documentation": 'https://unsplash.com/developers',
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'JSON',
+}
+
 url = 'https://unsplash.com/'
 search_url = url + 'napi/search/photos?'
 categories = ['images']

+ 14 - 13
searx/engines/vimeo.py

@@ -1,21 +1,22 @@
-#  Vimeo (Videos)
-#
-# @website     https://vimeo.com/
-# @provide-api yes (http://developer.vimeo.com/api),
-#              they have a maximum count of queries/hour
-#
-# @using-api   no (TODO, rewrite to api)
-# @results     HTML (using search portal)
-# @stable      no (HTML can change)
-# @parse       url, title, publishedDate,  thumbnail, embedded
-#
-# @todo        rewrite to api
-# @todo        set content-parameter with correct data
+# SPDX-License-Identifier: AGPL-3.0-or-later
+"""
+ Vimeo (Videos)
+"""

 from urllib.parse import urlencode
 from json import loads
 from dateutil import parser

+# about
+about = {
+    "website": 'https://vimeo.com/',
+    "wikidata_id": 'Q156376',
+    "official_api_documentation": 'http://developer.vimeo.com/api',
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 # engine dependent config
 categories = ['videos']
 paging = True

+ 11 - 9
searx/engines/wikidata.py

@@ -1,14 +1,6 @@
-# -*- coding: utf-8 -*-
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Wikidata
  Wikidata
-
- @website     https://wikidata.org
- @provide-api yes (https://query.wikidata.org/)
-
- @using-api   yes
- @results     JSON
- @stable      yes
- @parse       url, infobox
 """
 """
 
 
 
 
@@ -27,6 +19,16 @@ from searx.engines.wikipedia import _fetch_supported_languages, supported_langua

 logger = logger.getChild('wikidata')

+# about
+about = {
+    "website": 'https://wikidata.org/',
+    "wikidata_id": 'Q2013',
+    "official_api_documentation": 'https://query.wikidata.org/',
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'JSON',
+}
+
 # SPARQL
 SPARQL_ENDPOINT_URL = 'https://query.wikidata.org/sparql'
 SPARQL_EXPLAIN_URL = 'https://query.wikidata.org/bigdata/namespace/wdq/sparql?explain'

+ 11 - 8
searx/engines/wikipedia.py

@@ -1,13 +1,6 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Wikipedia (Web)
  Wikipedia (Web)
-
- @website     https://en.wikipedia.org/api/rest_v1/
- @provide-api yes
-
- @using-api   yes
- @results     JSON
- @stable      yes
- @parse       url, infobox
 """
 """
 
 
 from urllib.parse import quote
 from urllib.parse import quote
@@ -16,6 +9,16 @@ from lxml.html import fromstring
 from searx.utils import match_language, searx_useragent
 from searx.raise_for_httperror import raise_for_httperror

+# about
+about = {
+    "website": 'https://www.wikipedia.org/',
+    "wikidata_id": 'Q52',
+    "official_api_documentation": 'https://en.wikipedia.org/api/',
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'JSON',
+}
+
 # search-url
 search_url = 'https://{language}.wikipedia.org/api/rest_v1/page/summary/{title}'
 supported_languages_url = 'https://meta.wikimedia.org/wiki/List_of_Wikipedias'

+ 14 - 9
searx/engines/wolframalpha_api.py

@@ -1,16 +1,21 @@
-# Wolfram Alpha (Science)
-#
-# @website     https://www.wolframalpha.com
-# @provide-api yes (https://api.wolframalpha.com/v2/)
-#
-# @using-api   yes
-# @results     XML
-# @stable      yes
-# @parse       url, infobox
+# SPDX-License-Identifier: AGPL-3.0-or-later
+"""
+ Wolfram|Alpha (Science)
+"""

 from lxml import etree
 from urllib.parse import urlencode

+# about
+about = {
+    "website": 'https://www.wolframalpha.com',
+    "wikidata_id": 'Q207006',
+    "official_api_documentation": 'https://products.wolframalpha.com/api/',
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'XML',
+}
+
 # search-url
 search_url = 'https://api.wolframalpha.com/v2/query?appid={api_key}&{query}'
 site_url = 'https://www.wolframalpha.com/input/?{query}'

+ 14 - 9
searx/engines/wolframalpha_noapi.py

@@ -1,12 +1,7 @@
-# Wolfram|Alpha (Science)
-#
-# @website     https://www.wolframalpha.com/
-# @provide-api yes (https://api.wolframalpha.com/v2/)
-#
-# @using-api   no
-# @results     JSON
-# @stable      no
-# @parse       url, infobox
+# SPDX-License-Identifier: AGPL-3.0-or-later
+"""
+ Wolfram|Alpha (Science)
+"""

 from json import loads
 from time import time
@@ -14,6 +9,16 @@ from urllib.parse import urlencode

 from searx.poolrequests import get as http_get

+# about
+about = {
+    "website": 'https://www.wolframalpha.com/',
+    "wikidata_id": 'Q207006',
+    "official_api_documentation": 'https://products.wolframalpha.com/api/',
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'JSON',
+}
+
 # search-url
 url = 'https://www.wolframalpha.com/'


+ 11 - 8
searx/engines/www1x.py

@@ -1,19 +1,22 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  1x (Images)
  1x (Images)
-
- @website     http://1x.com/
- @provide-api no
-
- @using-api   no
- @results     HTML
- @stable      no (HTML can change)
- @parse       url, title, thumbnail
 """
 """
 
 
 from lxml import html, etree
 from lxml import html, etree
 from urllib.parse import urlencode, urljoin
 from urllib.parse import urlencode, urljoin
 from searx.utils import extract_text, eval_xpath_list, eval_xpath_getindex
 from searx.utils import extract_text, eval_xpath_list, eval_xpath_getindex
 
 
+# about
+about = {
+    "website": 'https://1x.com/',
+    "wikidata_id": None,
+    "official_api_documentation": None,
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 # engine dependent config
 categories = ['images']
 paging = False

+ 2 - 0
searx/engines/xpath.py

@@ -1,3 +1,5 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
+
 from lxml import html
 from urllib.parse import urlencode
 from searx.utils import extract_text, extract_url, eval_xpath, eval_xpath_list

+ 14 - 13
searx/engines/yacy.py

@@ -1,16 +1,7 @@
-# Yacy (Web, Images, Videos, Music, Files)
-#
-# @website     http://yacy.net
-# @provide-api yes
-#              (http://www.yacy-websuche.de/wiki/index.php/Dev:APIyacysearch)
-#
-# @using-api   yes
-# @results     JSON
-# @stable      yes
-# @parse       (general)    url, title, content, publishedDate
-# @parse       (images)     url, title, img_src
-#
-# @todo        parse video, audio and file results
+# SPDX-License-Identifier: AGPL-3.0-or-later
+"""
+ Yacy (Web, Images, Videos, Music, Files)
+"""
 

 from json import loads
 from dateutil import parser
 

 from searx.utils import html_to_text

+about = {
+    "website": 'https://yacy.net/',
+    "wikidata_id": 'Q1759675',
+    "official_api_documentation": 'https://wiki.yacy.net/index.php/Dev:API',
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'JSON',
+}
+
 # engine dependent config
 categories = ['general', 'images']  # TODO , 'music', 'videos', 'files'
 paging = True

+ 11 - 9
searx/engines/yahoo.py

@@ -1,20 +1,22 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Yahoo (Web)
  Yahoo (Web)
-
- @website     https://search.yahoo.com/web
- @provide-api yes (https://developer.yahoo.com/boss/search/),
-              $0.80/1000 queries
-
- @using-api   no (because pricing)
- @results     HTML (using search portal)
- @stable      no (HTML can change)
- @parse       url, title, content, suggestion
 """
 """
 
 
 from urllib.parse import unquote, urlencode
 from urllib.parse import unquote, urlencode
 from lxml import html
 from lxml import html
 from searx.utils import extract_text, extract_url, match_language, eval_xpath
 from searx.utils import extract_text, extract_url, match_language, eval_xpath
 
 
+# about
+about = {
+    "website": 'https://search.yahoo.com/',
+    "wikidata_id": None,
+    "official_api_documentation": 'https://developer.yahoo.com/api/',
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 # engine dependent config
 categories = ['general']
 paging = True

+ 14 - 10
searx/engines/yahoo_news.py

@@ -1,13 +1,7 @@
-# Yahoo (News)
-#
-# @website     https://news.yahoo.com
-# @provide-api yes (https://developer.yahoo.com/boss/search/)
-#              $0.80/1000 queries
-#
-# @using-api   no (because pricing)
-# @results     HTML (using search portal)
-# @stable      no (HTML can change)
-# @parse       url, title, content, publishedDate
+# SPDX-License-Identifier: AGPL-3.0-or-later
+"""
+ Yahoo (News)
+"""

 import re
 from datetime import datetime, timedelta
@@ -18,6 +12,16 @@ from searx.engines.yahoo import _fetch_supported_languages, supported_languages_
 from dateutil import parser
 from searx.utils import extract_text, extract_url, match_language

+# about
+about = {
+    "website": 'https://news.yahoo.com',
+    "wikidata_id": 'Q3044717',
+    "official_api_documentation": 'https://developer.yahoo.com/api/',
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 # engine dependent config
 categories = ['news']
 paging = True

+ 11 - 7
searx/engines/yandex.py

@@ -1,12 +1,6 @@
+# SPDX-License-Identifier: AGPL-3.0-or-later
 """
 """
  Yahoo (Web)
  Yahoo (Web)
-
- @website     https://yandex.ru/
- @provide-api ?
- @using-api   no
- @results     HTML (using search portal)
- @stable      no (HTML can change)
- @parse       url, title, content
 """
 """
 
 
 from urllib.parse import urlencode, urlparse
 from urllib.parse import urlencode, urlparse
@@ -16,6 +10,16 @@ from searx.exceptions import SearxEngineCaptchaException

 logger = logger.getChild('yandex engine')

+# about
+about = {
+    "website": 'https://yandex.ru/',
+    "wikidata_id": 'Q5281',
+    "official_api_documentation": "?",
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 # engine dependent config
 categories = ['general']
 paging = True

+ 14 - 9
searx/engines/yggtorrent.py

@@ -1,12 +1,7 @@
-#  Yggtorrent (Videos, Music, Files)
-#
-# @website     https://www2.yggtorrent.si
-# @provide-api no (nothing found)
-#
-# @using-api   no
-# @results     HTML (using search portal)
-# @stable      no (HTML can change)
-# @parse       url, title, seed, leech, publishedDate, filesize
+# SPDX-License-Identifier: AGPL-3.0-or-later
+"""
+ Yggtorrent (Videos, Music, Files)
+"""

 from lxml import html
 from operator import itemgetter
@@ -15,6 +10,16 @@ from urllib.parse import quote
 from searx.utils import extract_text, get_torrent_size
 from searx.poolrequests import get as http_get

+# about
+about = {
+    "website": 'https://www2.yggtorrent.si',
+    "wikidata_id": None,
+    "official_api_documentation": None,
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 # engine dependent config
 categories = ['videos', 'music', 'files']
 paging = True

+ 14 - 9
searx/engines/youtube_api.py

@@ -1,18 +1,23 @@
-# Youtube (Videos)
-#
-# @website     https://www.youtube.com/
-# @provide-api yes (https://developers.google.com/apis-explorer/#p/youtube/v3/youtube.search.list)
-#
-# @using-api   yes
-# @results     JSON
-# @stable      yes
-# @parse       url, title, content, publishedDate, thumbnail, embedded
+# SPDX-License-Identifier: AGPL-3.0-or-later
+"""
+ Youtube (Videos)
+"""

 from json import loads
 from dateutil import parser
 from urllib.parse import urlencode
 from searx.exceptions import SearxEngineAPIException

+# about
+about = {
+    "website": 'https://www.youtube.com/',
+    "wikidata_id": 'Q866',
+    "official_api_documentation": 'https://developers.google.com/youtube/v3/docs/search/list?apix=true',
+    "use_official_api": True,
+    "require_api_key": False,
+    "results": 'JSON',
+}
+
 # engine dependent config
 categories = ['videos', 'music']
 paging = False

+ 14 - 9
searx/engines/youtube_noapi.py

@@ -1,17 +1,22 @@
-# Youtube (Videos)
-#
-# @website     https://www.youtube.com/
-# @provide-api yes (https://developers.google.com/apis-explorer/#p/youtube/v3/youtube.search.list)
-#
-# @using-api   no
-# @results     HTML
-# @stable      no
-# @parse       url, title, content, publishedDate, thumbnail, embedded
+# SPDX-License-Identifier: AGPL-3.0-or-later
+"""
+ Youtube (Videos)
+"""

 from functools import reduce
 from json import loads
 from urllib.parse import quote_plus

+# about
+about = {
+    "website": 'https://www.youtube.com/',
+    "wikidata_id": 'Q866',
+    "official_api_documentation": 'https://developers.google.com/youtube/v3/docs/search/list?apix=true',
+    "use_official_api": False,
+    "require_api_key": False,
+    "results": 'HTML',
+}
+
 # engine dependent config
 categories = ['videos', 'music']
 paging = True

+ 213 - 0
searx/settings.yml

@@ -157,6 +157,13 @@ engines:
     timeout : 7.0
     disabled : True
     shortcut : ai
+    about:
+      website: https://archive.is/
+      wikidata_id: Q13515725
+      official_api_documentation: http://mementoweb.org/depot/native/archiveis/
+      use_official_api: false
+      require_api_key: false
+      results: HTML

   - name : arxiv
     engine : arxiv
@@ -201,6 +208,13 @@ engines:
     timeout : 4.0
     disabled : True
     shortcut : bb
+    about:
+      website: https://bitbucket.org/
+      wikidata_id: Q2493781
+      official_api_documentation: https://developer.atlassian.com/bitbucket
+      use_official_api: false
+      require_api_key: false
+      results: HTML

   - name : btdigg
     engine : btdigg
@@ -216,6 +230,13 @@ engines:
     categories : videos
     disabled : True
     shortcut : c3tv
+    about:
+      website: https://media.ccc.de/
+      wikidata_id: Q80729951
+      official_api_documentation: https://github.com/voc/voctoweb
+      use_official_api: false
+      require_api_key: false
+      results: HTML

   - name : crossref
     engine : json_engine
@@ -226,6 +247,13 @@ engines:
     content_query : fullCitation
     categories : science
     shortcut : cr
+    about:
+      website: https://www.crossref.org/
+      wikidata_id: Q5188229
+      official_api_documentation: https://github.com/CrossRef/rest-api-doc
+      use_official_api: false
+      require_api_key: false
+      results: JSON

   - name : currency
     engine : currency_convert
@@ -271,6 +299,13 @@ engines:
     categories : general
     shortcut : ew
     disabled : True
+    about:
+      website: https://www.erowid.org/
+      wikidata_id: Q1430691
+      official_api_documentation:
+      use_official_api: false
+      require_api_key: false
+      results: HTML

 #  - name : elasticsearch
 #    shortcut : es
@@ -321,6 +356,13 @@ engines:
     first_page_num : 1
     shortcut : et
     disabled : True
+    about:
+      website: https://www.etymonline.com/
+      wikidata_id: Q1188617
+      official_api_documentation:
+      use_official_api: false
+      require_api_key: false
+      results: HTML

 #  - name : ebay
 #    engine : ebay
@@ -360,6 +402,9 @@ engines:
     search_type : title
     timeout : 5.0
     disabled : True
+    about:
+      website: https://directory.fsf.org/
+      wikidata_id: Q2470288

   - name : frinkiac
     engine : frinkiac
@@ -394,6 +439,13 @@ engines:
     shortcut : gl
     timeout : 10.0
     disabled : True
+    about:
+      website: https://about.gitlab.com/
+      wikidata_id: Q16639197
+      official_api_documentation: https://docs.gitlab.com/ee/api/
+      use_official_api: false
+      require_api_key: false
+      results: JSON

   - name : github
     engine : github
@@ -411,6 +463,13 @@ engines:
     categories : it
     shortcut : cb
     disabled : True
+    about:
+      website: https://codeberg.org/
+      wikidata_id:
+      official_api_documentation: https://try.gitea.io/api/swagger
+      use_official_api: false
+      require_api_key: false
+      results: JSON

   - name : google
     engine : google
@@ -441,6 +500,13 @@ engines:
     first_page_num : 0
     categories : science
     shortcut : gos
+    about:
+      website: https://scholar.google.com/
+      wikidata_id: Q494817
+      official_api_documentation:
+      use_official_api: false
+      require_api_key: false
+      results: HTML

   - name : google play apps
     engine : xpath
@@ -453,6 +519,13 @@ engines:
     categories : files
     shortcut : gpa
     disabled : True
+    about:
+      website: https://play.google.com/
+      wikidata_id: Q79576
+      official_api_documentation:
+      use_official_api: false
+      require_api_key: false
+      results: HTML

   - name : google play movies
     engine : xpath
@@ -465,6 +538,13 @@ engines:
     categories : videos
     shortcut : gpm
     disabled : True
+    about:
+      website: https://play.google.com/
+      wikidata_id: Q79576
+      official_api_documentation:
+      use_official_api: false
+      require_api_key: false
+      results: HTML

   - name : google play music
     engine : xpath
@@ -477,6 +557,13 @@ engines:
     categories : music
     shortcut : gps
     disabled : True
+    about:
+      website: https://play.google.com/
+      wikidata_id: Q79576
+      official_api_documentation:
+      use_official_api: false
+      require_api_key: false
+      results: HTML

   - name : geektimes
     engine : xpath
@@ -489,6 +576,13 @@ engines:
     timeout : 4.0
     disabled : True
     shortcut : gt
+    about:
+      website: https://geektimes.ru/
+      wikidata_id: Q50572423
+      official_api_documentation:
+      use_official_api: false
+      require_api_key: false
+      results: HTML

   - name : habrahabr
     engine : xpath
@@ -501,6 +595,13 @@ engines:
     timeout : 4.0
     disabled : True
     shortcut : habr
+    about:
+      website: https://habr.com/
+      wikidata_id: Q4494434
+      official_api_documentation: https://habr.com/en/docs/help/api/
+      use_official_api: false
+      require_api_key: false
+      results: HTML

   - name : hoogle
     engine : json_engine
@@ -513,6 +614,13 @@ engines:
     page_size : 20
     categories : it
     shortcut : ho
+    about:
+      website: https://www.haskell.org/
+      wikidata_id: Q34010
+      official_api_documentation: https://hackage.haskell.org/api
+      use_official_api: false
+      require_api_key: false
+      results: JSON

   - name : ina
     engine : ina
@@ -543,6 +651,13 @@ engines:
     timeout : 7.0
     disabled : True
     shortcut : lg
+    about:
+      website: http://libgen.rs/
+      wikidata_id: Q22017206
+      official_api_documentation:
+      use_official_api: false
+      require_api_key: false
+      results: HTML

   - name : lobste.rs
     engine : xpath
@@ -555,6 +670,13 @@ engines:
     shortcut : lo
     timeout : 3.0
     disabled: True
+    about:
+      website: https://lobste.rs/
+      wikidata_id: Q60762874
+      official_api_documentation:
+      use_official_api: false
+      require_api_key: false
+      results: HTML

   - name : metager
     engine : xpath
@@ -566,6 +688,13 @@ engines:
     categories : general
     shortcut : mg
     disabled : True
+    about:
+      website: https://metager.org/
+      wikidata_id: Q1924645
+      official_api_documentation:
+      use_official_api: false
+      require_api_key: false
+      results: HTML

   - name : microsoft academic
     engine : microsoft_academic
@@ -589,6 +718,13 @@ engines:
     disabled: True
     timeout: 5.0
     shortcut : npm
+    about:
+      website: https://npms.io/
+      wikidata_id: Q7067518
+      official_api_documentation: https://api-docs.npms.io/
+      use_official_api: false
+      require_api_key: false
+      results: JSON

 # Requires Tor
   - name : not evil
@@ -617,6 +753,13 @@ engines:
     categories : science
     shortcut : oad
     timeout: 5.0
+    about:
+      website: https://www.openaire.eu/
+      wikidata_id: Q25106053
+      official_api_documentation: https://api.openaire.eu/
+      use_official_api: false
+      require_api_key: false
+      results: JSON

   - name : openairepublications
     engine : json_engine
@@ -629,6 +772,13 @@ engines:
     categories : science
     shortcut : oap
     timeout: 5.0
+    about:
+      website: https://www.openaire.eu/
+      wikidata_id: Q25106053
+      official_api_documentation: https://api.openaire.eu/
+      use_official_api: false
+      require_api_key: false
+      results: JSON

 #  - name : opensemanticsearch
 #    engine : opensemantic
@@ -650,6 +800,13 @@ engines:
     timeout : 4.0
     disabled : True
     shortcut : or
+    about:
+      website: https://openrepos.net/
+      wikidata_id:
+      official_api_documentation:
+      use_official_api: false
+      require_api_key: false
+      results: HTML

   - name : pdbe
     engine : pdbe
@@ -768,6 +925,13 @@ engines:
     content_xpath : .//div[@class="search-result-abstract"]
     shortcut : se
     categories : science
+    about:
+      website: https://www.semanticscholar.org/
+      wikidata_id: Q22908627
+      official_api_documentation: https://api.semanticscholar.org/
+      use_official_api: false
+      require_api_key: false
+      results: HTML

 # Spotify needs API credentials
 #  - name : spotify
@@ -876,6 +1040,9 @@ engines:
     number_of_results : 5
     search_type : text
     disabled : True
+    about:
+      website: https://www.wikibooks.org/
+      wikidata_id: Q367

   - name : wikinews
     engine : mediawiki
@@ -885,6 +1052,9 @@ engines:
     number_of_results : 5
     search_type : text
     disabled : True
+    about:
+      website: https://www.wikinews.org/
+      wikidata_id: Q964

   - name : wikiquote
     engine : mediawiki
@@ -896,6 +1066,9 @@ engines:
     disabled : True
     additional_tests:
       rosebud: *test_rosebud
+    about:
+      website: https://www.wikiquote.org/
+      wikidata_id: Q369

   - name : wikisource
     engine : mediawiki
@@ -905,6 +1078,9 @@ engines:
     number_of_results : 5
     search_type : text
     disabled : True
+    about:
+      website: https://www.wikisource.org/
+      wikidata_id: Q263

   - name : wiktionary
     engine : mediawiki
@@ -914,6 +1090,9 @@ engines:
     number_of_results : 5
     search_type : text
     disabled : True
+    about:
+      website: https://www.wiktionary.org/
+      wikidata_id: Q151

   - name : wikiversity
     engine : mediawiki
@@ -923,6 +1102,9 @@ engines:
     number_of_results : 5
     search_type : text
     disabled : True
+    about:
+      website: https://www.wikiversity.org/
+      wikidata_id: Q370

   - name : wikivoyage
     engine : mediawiki
@@ -932,6 +1114,9 @@ engines:
     number_of_results : 5
     search_type : text
     disabled : True
+    about:
+      website: https://www.wikivoyage.org/
+      wikidata_id: Q373

   - name : wolframalpha
     shortcut : wa
@@ -979,6 +1164,13 @@ engines:
     first_page_num : 0
     page_size : 10
     disabled : True
+    about:
+      website: https://www.seznam.cz/
+      wikidata_id: Q3490485
+      official_api_documentation: https://api.sklik.cz/
+      use_official_api: false
+      require_api_key: false
+      results: HTML

   - name : mojeek
     shortcut: mjk
@@ -993,6 +1185,13 @@ engines:
     first_page_num : 0
     page_size : 10
     disabled : True
+    about:
+      website: https://www.mojeek.com/
+      wikidata_id: Q60747299
+      official_api_documentation: https://www.mojeek.com/services/api.html/
+      use_official_api: false
+      require_api_key: false
+      results: HTML

   - name : naver
     shortcut: nvr
@@ -1007,6 +1206,13 @@ engines:
     first_page_num : 1
     page_size : 10
     disabled : True
+    about:
+      website: https://www.naver.com/
+      wikidata_id: Q485639
+      official_api_documentation: https://developers.naver.com/docs/nmt/examples/
+      use_official_api: false
+      require_api_key: false
+      results: HTML

   - name : rubygems
     shortcut: rbg
@@ -1021,6 +1227,13 @@ engines:
     first_page_num : 1
     categories: it
     disabled : True
+    about:
+      website: https://rubygems.org/
+      wikidata_id: Q1853420
+      official_api_documentation: https://guides.rubygems.org/rubygems-org-api/
+      use_official_api: false
+      require_api_key: false
+      results: HTML

   - name : peertube
     engine: peertube

+ 206 - 0
utils/fetch_engine_descriptions.py

@@ -0,0 +1,206 @@
+#!/usr/bin/env python
+
+import sys
+import json
+from urllib.parse import quote, urlparse
+from os.path import realpath, dirname
+import cld3
+from lxml.html import fromstring
+
+# set path
+sys.path.append(realpath(dirname(realpath(__file__)) + '/../'))
+
+from searx.engines.wikidata import send_wikidata_query
+from searx.utils import extract_text
+import searx
+import searx.search
+import searx.poolrequests
+
+SPARQL_WIKIPEDIA_ARTICLE = """
+SELECT DISTINCT ?item ?name
+WHERE {
+  VALUES ?item { %IDS% }
+  ?article schema:about ?item ;
+              schema:inLanguage ?lang ;
+              schema:name ?name ;
+              schema:isPartOf [ wikibase:wikiGroup "wikipedia" ] .
+  FILTER(?lang in (%LANGUAGES_SPARQL%)) .
+  FILTER (!CONTAINS(?name, ':')) .
+}
+"""
+
+SPARQL_DESCRIPTION = """
+SELECT DISTINCT ?item ?itemDescription
+WHERE {
+  VALUES ?item { %IDS% }
+  ?item schema:description ?itemDescription .
+  FILTER (lang(?itemDescription) in (%LANGUAGES_SPARQL%))
+}
+ORDER BY ?itemLang
+"""
+
+LANGUAGES = searx.settings['locales'].keys()
+LANGUAGES_SPARQL = ', '.join(set(map(lambda l: repr(l.split('_')[0]), LANGUAGES)))
+IDS = None
+
+descriptions = {}
+wd_to_engine_name = {}
+
+
+def normalize_description(description):
+    for c in [chr(c) for c in range(0, 31)]:
+        description = description.replace(c, ' ')
+    description = ' '.join(description.strip().split())
+    return description
+
+
+def update_description(engine_name, lang, description, source, replace=True):
+    if replace or lang not in descriptions[engine_name]:
+        descriptions[engine_name][lang] = [normalize_description(description), source]
+
+
+def get_wikipedia_summary(language, pageid):
+    search_url = 'https://{language}.wikipedia.org/api/rest_v1/page/summary/{title}'
+    url = search_url.format(title=quote(pageid), language=language)
+    try:
+        response = searx.poolrequests.get(url)
+        response.raise_for_status()
+        api_result = json.loads(response.text)
+        return api_result.get('extract')
+    except:
+        return None
+
+
+def detect_language(text):
+    r = cld3.get_language(str(text))  # pylint: disable=E1101
+    if r is not None and r.probability >= 0.98 and r.is_reliable:
+        return r.language
+    return None
+
+
+def get_website_description(url, lang1, lang2=None):
+    headers = {
+        'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:84.0) Gecko/20100101 Firefox/84.0',
+        'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8',
+        'DNT': '1',
+        'Upgrade-Insecure-Requests': '1',
+        'Sec-GPC': '1',
+        'Cache-Control': 'max-age=0',
+    }
+    if lang1 is not None:
+        lang_list = [lang1]
+        if lang2 is not None:
+            lang_list.append(lang2)
+        headers['Accept-Language'] = f'{",".join(lang_list)};q=0.8'
+    try:
+        response = searx.poolrequests.get(url, headers=headers, timeout=10)
+        response.raise_for_status()
+    except Exception:
+        return (None, None)
+
+    try:
+        html = fromstring(response.text)
+    except ValueError:
+        html = fromstring(response.content)
+
+    description = extract_text(html.xpath('/html/head/meta[@name="description"]/@content'))
+    if not description:
+        description = extract_text(html.xpath('/html/head/meta[@property="og:description"]/@content'))
+    if not description:
+        description = extract_text(html.xpath('/html/head/title'))
+    lang = extract_text(html.xpath('/html/@lang'))
+    if lang is None and lang1:
+        lang = lang1
+    lang = detect_language(description) or lang or 'en'
+    lang = lang.split('_')[0]
+    lang = lang.split('-')[0]
+    return (lang, description)
+
+
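+# Initialize the searx engines, build the mapping from Wikidata ID to
+# engine name(s), and the "wd:Qxxx ..." ID list for the SPARQL queries.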
+def initialize():
+    global descriptions, wd_to_engine_name, IDS
+    searx.search.initialize()
+    for engine_name, engine in searx.engines.engines.items():
+        descriptions[engine_name] = {}
+        wikidata_id = getattr(engine, "about", {}).get('wikidata_id')
+        if wikidata_id is not None:
+            wd_to_engine_name.setdefault(wikidata_id, set()).add(engine_name)
+
+    IDS = ' '.join(list(map(lambda wd_id: 'wd:' + wd_id, wd_to_engine_name.keys())))
+
+
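+# Ask the Wikidata SPARQL endpoint for the item descriptions and store
+# them; one-word descriptions (like "website") are skipped.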
+def fetch_wikidata_descriptions():
+    global IDS
+    result = send_wikidata_query(SPARQL_DESCRIPTION
+                                 .replace('%IDS%', IDS)
+                                 .replace('%LANGUAGES_SPARQL%', LANGUAGES_SPARQL))
+    if result is not None:
+        for binding in result['results']['bindings']:
+            wikidata_id = binding['item']['value'].replace('http://www.wikidata.org/entity/', '')
+            lang = binding['itemDescription']['xml:lang']
+            description = binding['itemDescription']['value']
+            if ' ' in description:  # skip single-word descriptions (like "website")
+                for engine_name in wd_to_engine_name[wikidata_id]:
+                    update_description(engine_name, lang, description, 'wikidata')
+
+
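+# Find the Wikipedia article of each item, fetch its summary and store
+# it as the description.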
+def fetch_wikipedia_descriptions():
+    global IDS
+    result = send_wikidata_query(SPARQL_WIKIPEDIA_ARTICLE
+                                 .replace('%IDS%', IDS)
+                                 .replace('%LANGUAGES_SPARQL%', LANGUAGES_SPARQL))
+    if result is not None:
+        for binding in result['results']['bindings']:
+            wikidata_id = binding['item']['value'].replace('http://www.wikidata.org/entity/', '')
+            lang = binding['name']['xml:lang']
+            pageid = binding['name']['value']
+            description = get_wikipedia_summary(lang, pageid)
+            if description is not None and ' ' in description:
+                for engine_name in wd_to_engine_name[wikidata_id]:
+                    update_description(engine_name, lang, description, 'wikipedia')
+
+
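+# Reduce an engine's search URL to the root of its website: strip path,
+# query and fragment, and drop a leading 'api.' subdomain.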
+def normalize_url(url):
+    url = url.replace('{language}', 'en')
+    url = urlparse(url)._replace(path='/', params='', query='', fragment='').geturl()
+    url = url.replace('https://api.', 'https://')
+    return url
+
+
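+# Fetch the description of one engine website: first with the default
+# Accept-Language, then for a fixed list of languages not yet covered,
+# stopping as soon as the site ignores the requested language.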
+def fetch_website_description(engine_name, website):
+    default_lang, default_description = get_website_description(website, None, None)
+    if default_lang is None or default_description is None:
+        return
+    if default_lang not in descriptions[engine_name]:
+        descriptions[engine_name][default_lang] = [normalize_description(default_description), website]
+    for request_lang in ('en-US', 'es-US', 'fr-FR', 'zh', 'ja', 'ru', 'ar', 'ko'):
+        if request_lang.split('-')[0] not in descriptions[engine_name]:
+            lang, desc = get_website_description(website, request_lang, request_lang.split('-')[0])
+            if desc is not None and desc != default_description:
+                update_description(engine_name, lang, desc, website, replace=False)
+            else:
+                break
+
+
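+# Fall back to the engine website for engines where neither Wikidata
+# nor Wikipedia provided a description.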
+def fetch_website_descriptions():
+    for engine_name, engine in searx.engines.engines.items():
+        website = getattr(engine, "about", {}).get('website')
+        if website is None and hasattr(engine, "search_url"):
+            website = normalize_url(getattr(engine, "search_url"))
+        if website is None and hasattr(engine, "base_url"):
+            website = normalize_url(getattr(engine, "base_url"))
+        if website is not None:
+            fetch_website_description(engine_name, website)
+
+
+def main():
+    initialize()
+    fetch_wikidata_descriptions()
+    fetch_wikipedia_descriptions()
+    fetch_website_descriptions()
+
+    sys.stdout.write(json.dumps(descriptions, indent=1, separators=(',', ':'), ensure_ascii=False))
+
+
+if __name__ == "__main__":
+    main()