diff options
| author | cy8aer <cybaer42@web.de> | 2018-07-09 15:34:43 +0200 |
|---|---|---|
| committer | GitHub <noreply@github.com> | 2018-07-09 15:34:43 +0200 |
| commit | 78be030500526ad073b1291baec6bfbf36eb221d (patch) | |
| tree | 35a567537690a7c84e76116798b61f7dd9befb0b /searx/engines | |
| parent | b786ac9a6360cc50472d572148343dc84b908830 (diff) | |
| parent | d51732c0e5e89f86abfe68718277a2e21b190103 (diff) | |
Merge branch 'master' into dsgvo
Diffstat (limited to 'searx/engines')
| -rw-r--r-- | searx/engines/bing.py | 5 | ||||
| -rw-r--r-- | searx/engines/wikidata.py | 3 |
2 files changed, 6 insertions, 2 deletions
```diff
diff --git a/searx/engines/bing.py b/searx/engines/bing.py
index c6d41782b..2da40619d 100644
--- a/searx/engines/bing.py
+++ b/searx/engines/bing.py
@@ -16,7 +16,7 @@
 from lxml import html
 from searx.engines.xpath import extract_text
 from searx.url_utils import urlencode
-from searx.utils import match_language
+from searx.utils import match_language, gen_useragent
 
 # engine dependent config
 categories = ['general']
@@ -43,6 +43,9 @@ def request(query, params):
         offset=offset)
 
     params['url'] = base_url + search_path
+
+    params['headers']['User-Agent'] = gen_useragent('Windows NT 6.3; WOW64')
+
     return params
 
 
diff --git a/searx/engines/wikidata.py b/searx/engines/wikidata.py
index fe53609c1..c315b30da 100644
--- a/searx/engines/wikidata.py
+++ b/searx/engines/wikidata.py
@@ -54,6 +54,7 @@ value_xpath = './/div[contains(@class,"wikibase-statementview-mainsnak")]'\
     + '/*/div[contains(@class,"wikibase-snakview-value")]'
 language_fallback_xpath = '//sup[contains(@class,"wb-language-fallback-indicator")]'
 calendar_name_xpath = './/sup[contains(@class,"wb-calendar-name")]'
+media_xpath = value_xpath + '//div[contains(@class,"commons-media-caption")]//a'
 
 
 def request(query, params):
@@ -313,7 +314,7 @@ def add_image(result):
     for property_id in property_ids:
         image = result.xpath(property_xpath.replace('{propertyid}', property_id))
         if image:
-            image_name = image[0].xpath(value_xpath)
+            image_name = image[0].xpath(media_xpath)
             image_src = url_image.replace('{filename}', extract_text(image_name[0]))
             return image_src
 
```