test_google_news.py 4.3 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697
  1. # -*- coding: utf-8 -*-
  2. from collections import defaultdict
  3. import mock
  4. from searx.engines import google_news
  5. from searx.testing import SearxTestCase
  class TestGoogleNewsEngine(SearxTestCase):
      """Tests for the ``request`` and ``response`` hooks of the google_news engine."""

      def _set_engine_attr(self, name, value):
          """Set ``google_news.<name>`` for the current test only.

          The previous value (or absence) of the attribute is restored when the
          test finishes, so module-level state does not leak into other tests.
          """
          # create=True: the attribute may not exist on the bare imported module.
          patcher = mock.patch.object(google_news, name, value, create=True)
          patcher.start()
          self.addCleanup(patcher.stop)

      def test_request(self):
          """``request`` must build a URL containing the query and the language."""
          self._set_engine_attr('supported_languages', ['en-US', 'fr-FR'])
          self._set_engine_attr('language_aliases', {})

          query = 'test_query'
          dicto = defaultdict(dict)
          dicto['pageno'] = 1
          dicto['language'] = 'fr-FR'
          dicto['time_range'] = 'w'

          params = google_news.request(query, dicto)

          self.assertIn('url', params)
          self.assertIn(query, params['url'])
          self.assertIn('fr', params['url'])

      def test_response(self):
          """``response`` must reject bad input and parse a result page."""
          # Inputs that are not response objects must raise AttributeError.
          self.assertRaises(AttributeError, google_news.response, None)
          self.assertRaises(AttributeError, google_news.response, [])
          self.assertRaises(AttributeError, google_news.response, '')
          self.assertRaises(AttributeError, google_news.response, '[]')

          # Response bodies without any result markup yield an empty list.
          response = mock.Mock(text='{}')
          self.assertEqual(google_news.response(response), [])

          response = mock.Mock(text='{"data": []}')
          self.assertEqual(google_news.response(response), [])

          # Fixture with two result entries; only the second has a thumbnail <img>.
          html = u"""
          <h2 class="hd">Search Results</h2>
          <div data-async-context="query:searx" id="ires">
          <div eid="oC2oWcGXCafR6ASkwoCwDA" id="rso">
          <div class="_NId">
          <!--m-->
          <div class="g _cy">
          <div class="ts _JGs _JHs _tJs _KGs _jHs">
          <div class="_hJs">
          <h3 class="r _gJs">
          <a class="l lLrAF" href="https://example.com/" onmousedown="return rwt(this,'','','','11','AFQjCNEyehpzD5cJK1KUfXBx9RmsbqqG9g','','0ahUKEwjB58OR54HWAhWnKJoKHSQhAMY4ChCpAggiKAAwAA','','',event)">Example title</a>
          </h3>
          <div class="slp">
          <span class="_OHs _PHs">
          Mac &amp; i</span>
          <span class="_QGs">
          -</span>
          <span class="f nsa _QHs">
          Mar 21, 2016</span>
          </div>
          <div class="st">Example description</div>
          </div>
          </div>
          </div>
          <div class="g _cy">
          <div class="ts _JGs _JHs _oGs _KGs _jHs">
          <a class="top _xGs _SHs" href="https://example2.com/" onmousedown="return rwt(this,'','','','12','AFQjCNHObfH7sYmLWI1SC-YhWXKZFRzRjw','','0ahUKEwjB58OR54HWAhWnKJoKHSQhAMY4ChC8iAEIJDAB','','',event)">
          <img class="th _RGs" src="https://example2.com/image.jpg" alt="Story image for searx from Golem.de" onload="typeof google==='object'&&google.aft&&google.aft(this)">
          </a>
          <div class="_hJs">
          <h3 class="r _gJs">
          <a class="l lLrAF" href="https://example2.com/" onmousedown="return rwt(this,'','','','12','AFQjCNHObfH7sYmLWI1SC-YhWXKZFRzRjw','','0ahUKEwjB58OR54HWAhWnKJoKHSQhAMY4ChCpAgglKAAwAQ','','',event)">Example title 2</a>
          </h3>
          <div class="slp">
          <span class="_OHs _PHs">
          Golem.de</span>
          <span class="_QGs">
          -</span>
          <span class="f nsa _QHs">
          Oct 4, 2016</span>
          </div>
          <div class="st">Example description 2</div>
          </div>
          </div>
          </div>
          </div>
          </div>
          </div>
          """  # noqa
          response = mock.Mock(text=html)
          results = google_news.response(response)

          self.assertIsInstance(results, list)
          self.assertEqual(len(results), 2)

          self.assertEqual(results[0]['title'], u'Example title')
          self.assertEqual(results[0]['url'], 'https://example.com/')
          self.assertEqual(results[0]['content'], 'Example description')

          self.assertEqual(results[1]['title'], u'Example title 2')
          self.assertEqual(results[1]['url'], 'https://example2.com/')
          self.assertEqual(results[1]['content'], 'Example description 2')
          self.assertEqual(results[1]['img_src'], 'https://example2.com/image.jpg')