test_command.py 9.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225
  1. # SPDX-License-Identifier: AGPL-3.0-or-later
  2. # pylint: disable=missing-module-docstring,disable=missing-class-docstring,invalid-name
  3. from searx.engines import command as command_engine
  4. from tests import SearxTestCase
  5. class TestCommandEngine(SearxTestCase):
  6. def test_basic_seq_command_engine(self):
  7. ls_engine = command_engine
  8. ls_engine.command = ['seq', '{{QUERY}}']
  9. ls_engine.delimiter = {'chars': ' ', 'keys': ['number']}
  10. expected_results = [
  11. {'number': '1', 'template': 'key-value.html'},
  12. {'number': '2', 'template': 'key-value.html'},
  13. {'number': '3', 'template': 'key-value.html'},
  14. {'number': '4', 'template': 'key-value.html'},
  15. {'number': '5', 'template': 'key-value.html'},
  16. ]
  17. results = ls_engine.search('5', {'pageno': 1})
  18. self.assertEqual(results, expected_results)
  19. def test_delimiter_parsing(self):
  20. searx_logs = '''DEBUG:searx.webapp:static directory is /home/n/p/searx/searx/static
  21. DEBUG:searx.webapp:templates directory is /home/n/p/searx/searx/templates
  22. DEBUG:searx.engines:soundcloud engine: Starting background initialization
  23. DEBUG:searx.engines:wolframalpha engine: Starting background initialization
  24. DEBUG:searx.engines:locate engine: Starting background initialization
  25. DEBUG:searx.engines:regex search in files engine: Starting background initialization
  26. DEBUG:urllib3.connectionpool:Starting new HTTPS connection (1): www.wolframalpha.com
  27. DEBUG:urllib3.connectionpool:Starting new HTTPS connection (1): soundcloud.com
  28. DEBUG:searx.engines:find engine: Starting background initialization
  29. DEBUG:searx.engines:pattern search in files engine: Starting background initialization
  30. DEBUG:searx.webapp:starting webserver on 127.0.0.1:8888
  31. WARNING:werkzeug: * Debugger is active!
  32. INFO:werkzeug: * Debugger PIN: 299-578-362'''
  33. echo_engine = command_engine
  34. echo_engine.command = ['echo', searx_logs]
  35. echo_engine.delimiter = {'chars': ':', 'keys': ['level', 'component', 'message']}
  36. expected_results_by_page = [
  37. [
  38. {
  39. 'component': 'searx.webapp',
  40. 'message': 'static directory is /home/n/p/searx/searx/static',
  41. 'template': 'key-value.html',
  42. 'level': 'DEBUG',
  43. },
  44. {
  45. 'component': 'searx.webapp',
  46. 'message': 'templates directory is /home/n/p/searx/searx/templates',
  47. 'template': 'key-value.html',
  48. 'level': 'DEBUG',
  49. },
  50. {
  51. 'component': 'searx.engines',
  52. 'message': 'soundcloud engine: Starting background initialization',
  53. 'template': 'key-value.html',
  54. 'level': 'DEBUG',
  55. },
  56. {
  57. 'component': 'searx.engines',
  58. 'message': 'wolframalpha engine: Starting background initialization',
  59. 'template': 'key-value.html',
  60. 'level': 'DEBUG',
  61. },
  62. {
  63. 'component': 'searx.engines',
  64. 'message': 'locate engine: Starting background initialization',
  65. 'template': 'key-value.html',
  66. 'level': 'DEBUG',
  67. },
  68. {
  69. 'component': 'searx.engines',
  70. 'message': 'regex search in files engine: Starting background initialization',
  71. 'template': 'key-value.html',
  72. 'level': 'DEBUG',
  73. },
  74. {
  75. 'component': 'urllib3.connectionpool',
  76. 'message': 'Starting new HTTPS connection (1): www.wolframalpha.com',
  77. 'template': 'key-value.html',
  78. 'level': 'DEBUG',
  79. },
  80. {
  81. 'component': 'urllib3.connectionpool',
  82. 'message': 'Starting new HTTPS connection (1): soundcloud.com',
  83. 'template': 'key-value.html',
  84. 'level': 'DEBUG',
  85. },
  86. {
  87. 'component': 'searx.engines',
  88. 'message': 'find engine: Starting background initialization',
  89. 'template': 'key-value.html',
  90. 'level': 'DEBUG',
  91. },
  92. {
  93. 'component': 'searx.engines',
  94. 'message': 'pattern search in files engine: Starting background initialization',
  95. 'template': 'key-value.html',
  96. 'level': 'DEBUG',
  97. },
  98. ],
  99. [
  100. {
  101. 'component': 'searx.webapp',
  102. 'message': 'starting webserver on 127.0.0.1:8888',
  103. 'template': 'key-value.html',
  104. 'level': 'DEBUG',
  105. },
  106. {
  107. 'component': 'werkzeug',
  108. 'message': ' * Debugger is active!',
  109. 'template': 'key-value.html',
  110. 'level': 'WARNING',
  111. },
  112. {
  113. 'component': 'werkzeug',
  114. 'message': ' * Debugger PIN: 299-578-362',
  115. 'template': 'key-value.html',
  116. 'level': 'INFO',
  117. },
  118. ],
  119. ]
  120. for i in [0, 1]:
  121. results = echo_engine.search('', {'pageno': i + 1})
  122. self.assertEqual(results, expected_results_by_page[i])
  123. def test_regex_parsing(self):
  124. txt = '''commit 35f9a8c81d162a361b826bbcd4a1081a4fbe76a7
  125. Author: Noémi Ványi <sitbackandwait@gmail.com>
  126. Date: Tue Oct 15 11:31:33 2019 +0200
  127. first interesting message
  128. commit 6c3c206316153ccc422755512bceaa9ab0b14faa
  129. Author: Noémi Ványi <sitbackandwait@gmail.com>
  130. Date: Mon Oct 14 17:10:08 2019 +0200
  131. second interesting message
  132. commit d8594d2689b4d5e0d2f80250223886c3a1805ef5
  133. Author: Noémi Ványi <sitbackandwait@gmail.com>
  134. Date: Mon Oct 14 14:45:05 2019 +0200
  135. third interesting message
  136. commit '''
  137. git_log_engine = command_engine
  138. git_log_engine.command = ['echo', txt]
  139. git_log_engine.result_separator = '\n\ncommit '
  140. git_log_engine.delimiter = {}
  141. git_log_engine.parse_regex = {
  142. 'commit': r'\w{40}',
  143. 'author': r'[\w* ]* <\w*@?\w*\.?\w*>',
  144. 'date': r'Date: .*',
  145. 'message': r'\n\n.*$',
  146. }
  147. git_log_engine.init({"command": git_log_engine.command, "parse_regex": git_log_engine.parse_regex})
  148. expected_results = [
  149. {
  150. 'commit': '35f9a8c81d162a361b826bbcd4a1081a4fbe76a7',
  151. 'author': ' Noémi Ványi <sitbackandwait@gmail.com>',
  152. 'date': 'Date: Tue Oct 15 11:31:33 2019 +0200',
  153. 'message': '\n\nfirst interesting message',
  154. 'template': 'key-value.html',
  155. },
  156. {
  157. 'commit': '6c3c206316153ccc422755512bceaa9ab0b14faa',
  158. 'author': ' Noémi Ványi <sitbackandwait@gmail.com>',
  159. 'date': 'Date: Mon Oct 14 17:10:08 2019 +0200',
  160. 'message': '\n\nsecond interesting message',
  161. 'template': 'key-value.html',
  162. },
  163. {
  164. 'commit': 'd8594d2689b4d5e0d2f80250223886c3a1805ef5',
  165. 'author': ' Noémi Ványi <sitbackandwait@gmail.com>',
  166. 'date': 'Date: Mon Oct 14 14:45:05 2019 +0200',
  167. 'message': '\n\nthird interesting message',
  168. 'template': 'key-value.html',
  169. },
  170. ]
  171. results = git_log_engine.search('', {'pageno': 1})
  172. self.assertEqual(results, expected_results)
  173. def test_working_dir_path_query(self):
  174. ls_engine = command_engine
  175. ls_engine.command = ['ls', '{{QUERY}}']
  176. ls_engine.result_separator = '\n'
  177. ls_engine.delimiter = {'chars': ' ', 'keys': ['file']}
  178. ls_engine.query_type = 'path'
  179. results = ls_engine.search('.', {'pageno': 1})
  180. self.assertTrue(len(results) != 0)
  181. forbidden_paths = [
  182. '..',
  183. '../..',
  184. './..',
  185. '~',
  186. '/var',
  187. ]
  188. for forbidden_path in forbidden_paths:
  189. self.assertRaises(ValueError, ls_engine.search, forbidden_path, {'pageno': 1})
  190. def test_enum_queries(self):
  191. echo_engine = command_engine
  192. echo_engine.command = ['echo', '{{QUERY}}']
  193. echo_engine.query_type = 'enum'
  194. echo_engine.query_enum = ['i-am-allowed-to-say-this', 'and-that']
  195. for allowed in echo_engine.query_enum:
  196. results = echo_engine.search(allowed, {'pageno': 1})
  197. self.assertTrue(len(results) != 0)
  198. forbidden_queries = [
  199. 'forbidden',
  200. 'banned',
  201. 'prohibited',
  202. ]
  203. for forbidden in forbidden_queries:
  204. self.assertRaises(ValueError, echo_engine.search, forbidden, {'pageno': 1})