diff options
| author | Markus Heiser <markus.heiser@darmarIT.de> | 2021-09-12 07:53:09 +0000 |
|---|---|---|
| committer | GitHub <noreply@github.com> | 2021-09-12 07:53:09 +0000 |
| commit | ecd6ca86d0ebe6a41902e8c980de46c5d0600eb6 (patch) | |
| tree | 157b41a60e69268d65d54f870b52399a701f5d64 /searx | |
| parent | 2de95af92330c83c7b1aecc146e0f52e8825c59b (diff) | |
| parent | 0f43b39eac44d548143b3944a2bfa26c039b2068 (diff) | |
Merge pull request #308 from dalf/plugin_hostname_replace
[enh] add hostname_replace plugin
Diffstat (limited to 'searx')
| -rw-r--r-- | searx/plugins/__init__.py | 2 | ||||
| -rw-r--r-- | searx/plugins/hostname_replace.py | 32 | ||||
| -rw-r--r-- | searx/settings.yml | 12 |
3 files changed, 45 insertions, 1 deletion
diff --git a/searx/plugins/__init__.py b/searx/plugins/__init__.py index 3a35f7025..1153c9ed1 100644 --- a/searx/plugins/__init__.py +++ b/searx/plugins/__init__.py @@ -31,6 +31,7 @@ from searx.plugins import (oa_doi_rewrite, hash_plugin, infinite_scroll, self_info, + hostname_replace, search_on_category_select, tracker_url_remover, vim_hotkeys) @@ -182,6 +183,7 @@ plugins.register(oa_doi_rewrite) plugins.register(hash_plugin) plugins.register(infinite_scroll) plugins.register(self_info) +plugins.register(hostname_replace) plugins.register(search_on_category_select) plugins.register(tracker_url_remover) plugins.register(vim_hotkeys) diff --git a/searx/plugins/hostname_replace.py b/searx/plugins/hostname_replace.py new file mode 100644 index 000000000..778b84615 --- /dev/null +++ b/searx/plugins/hostname_replace.py @@ -0,0 +1,32 @@ +# SPDX-License-Identifier: AGPL-3.0-or-later + +import re +from urllib.parse import urlunparse +from searx import settings +from searx.plugins import logger +from flask_babel import gettext + +name = gettext('Hostname replace') +description = gettext('Rewrite result hostnames or remove results based on the hostname') +default_on = False +preference_section = 'general' + +plugin_id = 'hostname_replace' + +replacements = {re.compile(p): r for (p, r) in settings[plugin_id].items()} if plugin_id in settings else {} + +logger = logger.getChild(plugin_id) +parsed = 'parsed_url' + + +def on_result(request, search, result): + if parsed not in result: + return True + for (pattern, replacement) in replacements.items(): + if pattern.search(result[parsed].netloc): + if not replacement: + return False + result[parsed] = result[parsed]._replace(netloc=pattern.sub(replacement, result[parsed].netloc)) + result['url'] = urlunparse(result[parsed]) + + return True diff --git a/searx/settings.yml b/searx/settings.yml index e5eb9dd65..8e2aeb5e9 100644 --- a/searx/settings.yml +++ b/searx/settings.yml @@ -150,7 +150,17 @@ outgoing: # # enabled_plugins: # - 
"HTTPS rewrite" -# - ... +# - "Hostname replace" # see configuration below + +# "Hostname replace" plugin configuration example: +# hostname_replace: +# '(.*\.)?youtube\.com$': 'invidious.example.com' +# '(.*\.)?youtu\.be$': 'invidious.example.com' +# '(.*\.)?youtube-nocookie\.com$': 'yotter.example.com' +# '(.*\.)?reddit\.com$': 'teddit.example.com' +# '(.*\.)?redd\.it$': 'teddit.example.com' +# '(www\.)?twitter\.com$': 'nitter.example.com' +# 'spam\.example\.com': false # remove results from spam.example.com checker: # disable checker when in debug mode |