autocomplete.py 1.6 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364
  1. from lxml import etree
  2. from requests import get
  3. from json import loads
  4. from urllib import urlencode
  5. def dbpedia(query):
  6. # dbpedia autocompleter
  7. autocomplete_url = 'http://lookup.dbpedia.org/api/search.asmx/KeywordSearch?' # noqa
  8. response = get(autocomplete_url
  9. + urlencode(dict(QueryString=query)))
  10. results = []
  11. if response.ok:
  12. dom = etree.fromstring(response.content)
  13. results = dom.xpath('//a:Result/a:Label//text()',
  14. namespaces={'a': 'http://lookup.dbpedia.org/'})
  15. return results
  16. def duckduckgo(query):
  17. # wikipedia autocompleter
  18. url = 'https://ac.duckduckgo.com/ac/?{0}&type=list'
  19. resp = loads(get(url.format(urlencode(dict(q=query)))).text)
  20. if len(resp) > 1:
  21. return resp[1]
  22. return []
  23. def google(query):
  24. # google autocompleter
  25. autocomplete_url = 'http://suggestqueries.google.com/complete/search?client=toolbar&' # noqa
  26. response = get(autocomplete_url
  27. + urlencode(dict(q=query)))
  28. results = []
  29. if response.ok:
  30. dom = etree.fromstring(response.text)
  31. results = dom.xpath('//suggestion/@data')
  32. return results
  33. def wikipedia(query):
  34. # wikipedia autocompleter
  35. url = 'https://en.wikipedia.org/w/api.php?action=opensearch&{0}&limit=10&namespace=0&format=json' # noqa
  36. resp = loads(get(url.format(urlencode(dict(q=query)))).text)
  37. if len(resp) > 1:
  38. return resp[1]
  39. return []
  40. backends = {'dbpedia': dbpedia,
  41. 'duckduckgo': duckduckgo,
  42. 'google': google,
  43. 'wikipedia': wikipedia
  44. }