youtube.py 2.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384
  1. ## Youtube (Videos)
  2. #
  3. # @website https://www.youtube.com/
  4. # @provide-api yes (http://gdata-samples-youtube-search-py.appspot.com/)
  5. #
  6. # @using-api yes
  7. # @results JSON
  8. # @stable yes
  9. # @parse url, title, content, publishedDate, thumbnail
  10. from json import loads
  11. from urllib import urlencode
  12. from dateutil import parser
  13. # engine dependent config
  14. categories = ['videos', 'music']
  15. paging = True
  16. language_support = True
  17. # search-url
  18. base_url = 'https://gdata.youtube.com/feeds/api/videos'
  19. search_url = base_url + '?alt=json&{query}&start-index={index}&max-results=5' # noqa
  20. # do search-request
  21. def request(query, params):
  22. index = (params['pageno'] - 1) * 5 + 1
  23. params['url'] = search_url.format(query=urlencode({'q': query}),
  24. index=index)
  25. # add language tag if specified
  26. if params['language'] != 'all':
  27. params['url'] += '&lr=' + params['language'].split('_')[0]
  28. return params
  29. # get response from search-request
  30. def response(resp):
  31. results = []
  32. search_results = loads(resp.text)
  33. # return empty array if there are no results
  34. if not 'feed' in search_results:
  35. return []
  36. feed = search_results['feed']
  37. # parse results
  38. for result in feed['entry']:
  39. url = [x['href'] for x in result['link'] if x['type'] == 'text/html']
  40. if not url:
  41. return
  42. # remove tracking
  43. url = url[0].replace('feature=youtube_gdata', '')
  44. if url.endswith('&'):
  45. url = url[:-1]
  46. title = result['title']['$t']
  47. content = ''
  48. thumbnail = ''
  49. pubdate = result['published']['$t']
  50. publishedDate = parser.parse(pubdate)
  51. if result['media$group']['media$thumbnail']:
  52. thumbnail = result['media$group']['media$thumbnail'][0]['url']
  53. content = result['content']['$t']
  54. # append result
  55. results.append({'url': url,
  56. 'title': title,
  57. 'content': content,
  58. 'template': 'videos.html',
  59. 'publishedDate': publishedDate,
  60. 'thumbnail': thumbnail})
  61. # return results
  62. return results