google_news.py 1.3 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344
  1. #!/usr/bin/env python
  2. from urllib import urlencode
  3. from json import loads
  4. from dateutil import parser
  5. from datetime import datetime
  6. categories = ['news']
  7. url = 'https://ajax.googleapis.com/'
  8. search_url = url + 'ajax/services/search/news?v=2.0&start={offset}&rsz=large&safe=off&filter=off&{query}&hl={language}' # noqa
  9. paging = True
  10. language_support = True
  11. def request(query, params):
  12. offset = (params['pageno'] - 1) * 8
  13. language = 'en-US'
  14. if params['language'] != 'all':
  15. language = params['language'].replace('_', '-')
  16. params['url'] = search_url.format(offset=offset,
  17. query=urlencode({'q': query}),
  18. language=language)
  19. return params
  20. def response(resp):
  21. results = []
  22. search_res = loads(resp.text)
  23. if not search_res.get('responseData', {}).get('results'):
  24. return []
  25. for result in search_res['responseData']['results']:
  26. # Mon, 10 Mar 2014 16:26:15 -0700
  27. publishedDate = parser.parse(result['publishedDate'])
  28. results.append({'url': result['unescapedUrl'],
  29. 'title': result['titleNoFormatting'],
  30. 'publishedDate': publishedDate,
  31. 'content': result['content']})
  32. return results