ebay.py 2.1 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768
  1. # Ebay (Videos, Music, Files)
  2. #
  3. # @website https://www.ebay.com
  4. # @provide-api no (nothing found)
  5. #
  6. # @using-api no
  7. # @results HTML (using search portal)
  8. # @stable yes (HTML can change)
  9. # @parse url, title, content, price, shipping, source
  10. from lxml import html
  11. from searx.engines.xpath import extract_text
  12. from urllib.parse import quote
  13. categories = ['shopping']
  14. paging = True
  15. url = 'https://www.ebay.com'
  16. search_url = url + '/sch/i.html?_nkw={query}&_sacat={pageno}'
  17. results_xpath = '//li[contains(@class, "s-item")]'
  18. url_xpath = './/a[@class="s-item__link"]/@href'
  19. title_xpath = './/h3[@class="s-item__title"]'
  20. content_xpath = './/div[@span="SECONDARY_INFO"]'
  21. price_xpath = './/div[contains(@class, "s-item__detail")]/span[@class="s-item__price"][1]/text()'
  22. shipping_xpath = './/span[contains(@class, "s-item__shipping")]/text()'
  23. source_country_xpath = './/span[contains(@class, "s-item__location")]/text()'
  24. thumbnail_xpath = './/img[@class="s-item__image-img"]/@src'
  25. def request(query, params):
  26. params['url'] = search_url.format(query=quote(query), pageno=params['pageno'])
  27. return params
  28. def response(resp):
  29. results = []
  30. dom = html.fromstring(resp.text)
  31. results_dom = dom.xpath(results_xpath)
  32. if not results_dom:
  33. return []
  34. for result_dom in results_dom:
  35. url = extract_text(result_dom.xpath(url_xpath))
  36. title = extract_text(result_dom.xpath(title_xpath))
  37. content = extract_text(result_dom.xpath(content_xpath))
  38. price = extract_text(result_dom.xpath(price_xpath))
  39. shipping = extract_text(result_dom.xpath(shipping_xpath))
  40. source_country = extract_text(result_dom.xpath(source_country_xpath))
  41. thumbnail = extract_text(result_dom.xpath(thumbnail_xpath))
  42. if title == "":
  43. continue
  44. results.append({
  45. 'url': url,
  46. 'title': title,
  47. 'content': content,
  48. 'price': price,
  49. 'shipping': shipping,
  50. 'source_country': source_country,
  51. 'thumbnail': thumbnail,
  52. 'template': 'products.html',
  53. })
  54. return results