1234567891011121314151617181920212223242526272829303132333435363738 |
- from urllib import urlencode
- from HTMLParser import HTMLParser
- from xpath import extract_text
- from lxml import html
# Site root; result links are built by appending a path to it.
base_url = 'http://vimeo.com'
# Search endpoint; ``{query}`` is filled with the URL-encoded query string.
search_url = base_url + '/search?{query}'

# Cookies attached to every search request (assigned to params['cookies']
# in request()).
# NOTE(review): the value looks like a zeroed-out placeholder -- confirm why
# the site needs this cookie to be present.
Cookie = {
    '__utma': '00000000.000#0000000.0000000000.0000000000.0000000000.0',
}
def request(query, params):
    """Fill in the outgoing search request for *query*.

    Sets ``params['url']`` to ``search_url`` with *query* URL-encoded as the
    ``q`` parameter, sets ``params['cookies']`` to the module-level
    ``Cookie`` dict, and returns the same *params* mapping.
    """
    # The former debug ``print`` of the URL was dropped: it wrote to stdout
    # on every search and was Python-2-only statement syntax.
    params['url'] = search_url.format(query=urlencode({'q': query}))
    params['cookies'] = Cookie
    return params
def response(resp):
    """Turn a search result page into a list of result dicts.

    ``resp.text`` is parsed with ``html.fromstring``; every node matched by
    ``results_xpath`` yields one dict with the keys ``url``, ``title`` and
    ``content``.

    NOTE(review): ``results_xpath``, ``url_xpath``, ``title_xpath`` and
    ``content_xpath`` are not defined in the visible part of this module --
    presumably they are provided elsewhere; confirm.
    """
    document = html.fromstring(resp.text)
    entity_decoder = HTMLParser()
    # The template skips placeholder {1}, so the title handed to format()
    # below never shows up in the generated markup.
    snippet_template = '<a href="{0}"> <img src="{2}"/> </a>'

    def build_entry(node):
        # The first url_xpath match is appended to base_url.
        link = base_url + node.xpath(url_xpath)[0]
        heading = entity_decoder.unescape(
            extract_text(node.xpath(title_xpath)))
        image_src = extract_text(node.xpath(content_xpath)[0])
        return {
            'url': link,
            'title': heading,
            'content': snippet_template.format(link, heading, image_src),
        }

    return [build_entry(node) for node in document.xpath(results_xpath)]
|