summaryrefslogtreecommitdiff
path: root/searx/plugins/hostname_replace.py
blob: acbc6304c1dda84d829de70fdcb2c72d35c36989 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
# SPDX-License-Identifier: AGPL-3.0-or-later

import re
from urllib.parse import urlunparse, urlparse
from searx import settings
from searx.plugins import logger
from flask_babel import gettext

name = gettext('Hostname replace')
description = gettext('Rewrite result hostnames or remove results based on the hostname')
default_on = False
preference_section = 'general'

plugin_id = 'hostname_replace'

replacements = {re.compile(p): r for (p, r) in settings[plugin_id].items()} if plugin_id in settings else {}

logger = logger.getChild(plugin_id)
parsed = 'parsed_url'


def on_result(request, search, result):
    if parsed not in result:
        return True
    for (pattern, replacement) in replacements.items():
        if pattern.search(result[parsed].netloc):
            if not replacement:
                return False
            result[parsed] = result[parsed]._replace(netloc=pattern.sub(replacement, result[parsed].netloc))
            result['url'] = urlunparse(result[parsed])
        if result.get('data_src', False):
            parsed_data_src = urlparse(result['data_src'])
            if pattern.search(parsed_data_src.netloc):
                parsed_data_src = parsed_data_src._replace(netloc=pattern.sub(replacement, parsed_data_src.netloc))
                result['data_src'] = urlunparse(parsed_data_src)
        if result.get('audio_src', False):
            parsed_audio_src = urlparse(result['audio_src'])
            if pattern.search(parsed_audio_src.netloc):
                parsed_audio_src = parsed_audio_src._replace(netloc=pattern.sub(replacement, parsed_audio_src.netloc))
                result['audio_src'] = urlunparse(parsed_audio_src)

    return True