Browse Source

[fix] duckduckgo news: unescaped html sequences in description

Bnyro 1 month ago
parent
commit
c28d35c7fc
1 changed file with 2 additions and 2 deletions
  1. 2 2
      searx/engines/duckduckgo_extra.py

+ 2 - 2
searx/engines/duckduckgo_extra.py

@@ -9,7 +9,7 @@ from __future__ import annotations
 from datetime import datetime
 from typing import TYPE_CHECKING
 from urllib.parse import urlencode
-from searx.utils import get_embeded_stream_url
+from searx.utils import get_embeded_stream_url, html_to_text
 
 from searx.engines.duckduckgo import fetch_traits  # pylint: disable=unused-import
 from searx.engines.duckduckgo import get_ddg_lang, get_vqd
@@ -126,7 +126,7 @@ def _news_result(result):
     return {
         'url': result['url'],
         'title': result['title'],
-        'content': result['excerpt'],
+        'content': html_to_text(result['excerpt']),
         'source': result['source'],
         'publishedDate': datetime.fromtimestamp(result['date']),
     }