Browse Source

[fix] yahoo engine url extraction

Adam Tauber 11 years ago
parent
commit
ee1ffbc87f
2 changed files with 2 additions and 2 deletions
  1. +1 -1
      searx/engines/yahoo.py
  2. +1 -1
      searx/engines/yahoo_news.py

+ 1 - 1
searx/engines/yahoo.py

@@ -35,7 +35,7 @@ def response(resp):
 
     for result in dom.xpath(results_xpath):
         url_string = extract_url(result.xpath(url_xpath), search_url)
-        start = url_string.find('/RU=')+4
+        start = url_string.find('http', url_string.find('/RU=')+1)
         end = url_string.rfind('/RS')
         url = unquote(url_string[start:end])
         title = extract_text(result.xpath(title_xpath)[0])

+ 1 - 1
searx/engines/yahoo_news.py

@@ -35,7 +35,7 @@ def response(resp):
 
     for result in dom.xpath(results_xpath):
         url_string = extract_url(result.xpath(url_xpath), search_url)
-        start = url_string.find('/RU=')+4
+        start = url_string.find('http', url_string.find('/RU=')+1)
         end = url_string.rfind('/RS')
         url = unquote(url_string[start:end])
         title = extract_text(result.xpath(title_xpath)[0])