Browse Source

[fix] remove html tags from qwant results

Adam Tauber 8 years ago
parent
commit
c3dcebb778
1 changed file with 6 additions and 4 deletions
  1. 6 4
      searx/engines/qwant.py

+ 6 - 4
searx/engines/qwant.py

@@ -10,9 +10,11 @@
  @parse       url, title, content
 """
 
-from urllib import urlencode
-from json import loads
 from datetime import datetime
+from json import loads
+from urllib import urlencode
+
+from searx.utils import html_to_text
 
 # engine dependent config
 categories = None
@@ -66,9 +68,9 @@ def response(resp):
     # parse results
     for result in res.get('items', {}):
 
-        title = result['title']
+        title = html_to_text(result['title'])
         res_url = result['url']
-        content = result['desc']
+        content = html_to_text(result['desc'])
 
         if category_to_keyword.get(categories[0], '') == 'web':
             results.append({'title': title,