metacpan.py 2.0 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879
  1. # SPDX-License-Identifier: AGPL-3.0-or-later
  2. # lint: pylint
  3. """metacpan
  4. """
  5. from urllib.parse import urlunparse
  6. from json import dumps
  7. # about
  8. about = {
  9. "website": 'https://metacpan.org/',
  10. "wikidata_id": 'Q841507',
  11. "official_api_documentation": 'https://github.com/metacpan/metacpan-api/blob/master/docs/API-docs.md',
  12. "use_official_api": True,
  13. "require_api_key": False,
  14. "results": 'JSON',
  15. }
  16. # engine dependent config
  17. number_of_results = 20 # Don't put this over 5000
  18. categories = ["it", "packages"]
  19. disabled = True
  20. shortcut = "cpan"
  21. paging = True
  22. query_data_template = {
  23. 'query': {
  24. 'multi_match': {
  25. 'type': 'most_fields',
  26. 'fields': ['documentation', 'documentation.*'],
  27. 'analyzer': 'camelcase',
  28. }
  29. },
  30. 'filter': {
  31. 'bool': {
  32. 'must': [
  33. {'exists': {'field': 'documentation'}},
  34. {'term': {'status': 'latest'}},
  35. {'term': {'indexed': 1}},
  36. {'term': {'authorized': 1}},
  37. ]
  38. }
  39. },
  40. "sort": [
  41. {"_score": {"order": "desc"}},
  42. {"date": {"order": "desc"}},
  43. ],
  44. '_source': ['documentation', "abstract"],
  45. 'size': number_of_results,
  46. }
  47. search_url = urlunparse(["https", "fastapi.metacpan.org", "/v1/file/_search", "", "", ""])
  48. def request(query, params):
  49. params["url"] = search_url
  50. params["method"] = "POST"
  51. query_data = query_data_template
  52. query_data["query"]["multi_match"]["query"] = query
  53. query_data["from"] = (params["pageno"] - 1) * number_of_results
  54. params["data"] = dumps(query_data)
  55. return params
  56. def response(resp):
  57. results = []
  58. search_results = resp.json()["hits"]["hits"]
  59. for result in search_results:
  60. fields = result["_source"]
  61. module = fields["documentation"]
  62. results.append(
  63. {
  64. "url": "https://metacpan.org/pod/" + module,
  65. "title": module,
  66. "content": fields.get("abstract", ""),
  67. }
  68. )
  69. return results