From 7c80807bb8204e9ef0df9a39207e30587c856c0a Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=C3=89milien=20=28perso=29?= <4016501+unixfox@users.noreply.github.com> Date: Wed, 17 Jan 2024 09:14:36 +0100 Subject: [PATCH] Block HeadlessChrome (#3116) --- searx/botdetection/http_user_agent.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/searx/botdetection/http_user_agent.py b/searx/botdetection/http_user_agent.py index e2e02a9bb..9e45c7f9d 100644 --- a/searx/botdetection/http_user_agent.py +++ b/searx/botdetection/http_user_agent.py @@ -35,7 +35,7 @@ USER_AGENT = ( + r'|HttpClient|Jersey|Python|libwww-perl|Ruby|SynHttpClient|UniversalFeedParser|Googlebot|GoogleImageProxy' + r'|bingbot|Baiduspider|yacybot|YandexMobileBot|YandexBot|Yahoo! Slurp|MJ12bot|AhrefsBot|archive.org_bot|msnbot' + r'|MJ12bot|SeznamBot|linkdexbot|Netvibes|SMTBot|zgrab|James BOT|Sogou|Abonti|Pixray|Spinn3r|SemrushBot|Exabot' - + r'|ZmEu|BLEXBot|bitlybot' + + r'|ZmEu|BLEXBot|bitlybot|HeadlessChrome' # unmaintained Farside instances + r'|' + re.escape(r'Mozilla/5.0 (compatible; Farside/0.1.0; +https://farside.link)')