1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556 |
- from os.path import realpath, dirname, splitext, join
- from os import listdir
- from imp import load_source
- import grequests
- engine_dir = dirname(realpath(__file__))
- engines = {}
- for filename in listdir(engine_dir):
- modname = splitext(filename)[0]
- if filename.startswith('_') or not filename.endswith('.py'):
- continue
- filepath = join(engine_dir, filename)
- engine = load_source(modname, filepath)
- if not hasattr(engine, 'request') or not hasattr(engine, 'response'):
- continue
- engines[modname] = engine
- def default_request_params():
- return {'method': 'GET', 'headers': {}, 'data': {}, 'url': ''}
- def make_callback(engine_name, results, callback):
- def process_callback(response, **kwargs):
- for result in callback(response):
- result['engine'] = engine_name
- results.append(result)
- return process_callback
- def search(query, request, selected_engines):
- global engines
- requests = []
- results = []
- user_agent = request.headers.get('User-Agent', '')
- for ename, engine in engines.items():
- if ename not in selected_engines:
- continue
- headers = default_request_params()
- headers['User-Agent'] = user_agent
- request_params = engine.request(query, headers)
- callback = make_callback(ename, results, engine.response)
- if request_params['method'] == 'GET':
- req = grequests.get(request_params['url']
- ,headers=headers
- ,hooks=dict(response=callback)
- )
- else:
- req = grequests.post(request_params['url']
- ,data=request_params['data']
- ,headers=headers
- ,hooks=dict(response=callback)
- )
- requests.append(req)
- grequests.map(requests)
- return results
|