summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
-rw-r--r--searx/engines/baidu.py9
1 files changed, 7 insertions, 2 deletions
diff --git a/searx/engines/baidu.py b/searx/engines/baidu.py
index 1c9d86733..29c9c0e4d 100644
--- a/searx/engines/baidu.py
+++ b/searx/engines/baidu.py
@@ -9,6 +9,7 @@
from urllib.parse import urlencode
from datetime import datetime
+from html import unescape
import time
import json
@@ -119,11 +120,15 @@ def parse_general(data):
except (ValueError, TypeError):
published_date = None
+ # title and content sometimes containing characters such as & ' " etc...
+ title = unescape(entry["title"])
+ content = unescape(entry.get("abs", ""))
+
results.append(
{
- "title": entry["title"],
+ "title": title,
"url": entry["url"],
- "content": entry.get("abs", ""),
+ "content": content,
"publishedDate": published_date,
}
)