tracker_url_remover.py 1.3 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344
  1. '''
  2. searx is free software: you can redistribute it and/or modify
  3. it under the terms of the GNU Affero General Public License as published by
  4. the Free Software Foundation, either version 3 of the License, or
  5. (at your option) any later version.
  6. searx is distributed in the hope that it will be useful,
  7. but WITHOUT ANY WARRANTY; without even the implied warranty of
  8. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  9. GNU Affero General Public License for more details.
  10. You should have received a copy of the GNU Affero General Public License
  11. along with searx. If not, see < http://www.gnu.org/licenses/ >.
  12. (C) 2015 by Adam Tauber, <asciimoo@gmail.com>
  13. '''
  14. from flask.ext.babel import gettext
  15. import re
  16. regexes = {re.compile(r'utm_[^&]+&?'),
  17. re.compile(r'(wkey|wemail)[^&]+&?'),
  18. re.compile(r'&$')}
  19. name = gettext('Tracker URL remover')
  20. description = gettext('Remove trackers arguments from the returned URL')
  21. default_on = True
  22. def on_result(request, ctx):
  23. splited_url = ctx['result']['url'].split('?')
  24. if len(splited_url) is not 2:
  25. return True
  26. for reg in regexes:
  27. splited_url[1] = reg.sub('', splited_url[1])
  28. if splited_url[1] == "":
  29. ctx['result']['url'] = splited_url[0]
  30. else:
  31. ctx['result']['url'] = splited_url[0] + '?' + splited_url[1]
  32. return True