diff options
| author | Markus Heiser <markus.heiser@darmarit.de> | 2021-01-22 18:49:45 +0100 |
|---|---|---|
| committer | Markus Heiser <markus.heiser@darmarit.de> | 2021-01-22 18:49:45 +0100 |
| commit | baec54c49295020bd925e34a705afca29d7458f3 (patch) | |
| tree | f8a9c8c6c28c6596249cf735cbb2b34fb20ca76d /searx/engines/google_images.py | |
| parent | f310305c54c3cd1d9fc74f09453294edbd2b5486 (diff) | |
[fix] revise of the google-news engine
This revise is based on the methods developed in the revise of the google engine
(see commit 410c2f9).
Signed-off-by: Markus Heiser <markus.heiser@darmarit.de>
Diffstat (limited to 'searx/engines/google_images.py')
| -rw-r--r-- | searx/engines/google_images.py | 12 |
1 files changed, 3 insertions, 9 deletions
diff --git a/searx/engines/google_images.py b/searx/engines/google_images.py index 8c2cb9d2a..612682c44 100644 --- a/searx/engines/google_images.py +++ b/searx/engines/google_images.py @@ -12,10 +12,9 @@ Definitions`_. Header set Content-Security-Policy "img-src 'self' data: ;" """ -from urllib.parse import urlencode, urlparse, unquote +from urllib.parse import urlencode, unquote from lxml import html from searx import logger -from searx.exceptions import SearxEngineCaptchaException from searx.utils import extract_text, eval_xpath from searx.engines.google import _fetch_supported_languages, supported_languages_url # NOQA # pylint: disable=unused-import @@ -23,6 +22,7 @@ from searx.engines.google import ( get_lang_country, google_domains, time_range_dict, + detect_google_sorry, ) logger = logger.getChild('google images') @@ -123,13 +123,7 @@ def response(resp): """Get response from google's search request""" results = [] - # detect google sorry - resp_url = urlparse(resp.url) - if resp_url.netloc == 'sorry.google.com' or resp_url.path == '/sorry/IndexRedirect': - raise SearxEngineCaptchaException() - - if resp_url.path.startswith('/sorry'): - raise SearxEngineCaptchaException() + detect_google_sorry(resp) # which subdomain ? # subdomain = resp.search_params.get('google_subdomain') |