From 8efc091fcbd5790b02a64f5af3e7da5193b87b23 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=C3=89milien=20=28perso=29?= <4016501+unixfox@users.noreply.github.com> Date: Thu, 11 Jan 2024 15:34:40 +0100 Subject: [PATCH] Block HeadlessChrome --- searx/botdetection/http_user_agent.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/searx/botdetection/http_user_agent.py b/searx/botdetection/http_user_agent.py index e2e02a9bb..9e45c7f9d 100644 --- a/searx/botdetection/http_user_agent.py +++ b/searx/botdetection/http_user_agent.py @@ -35,7 +35,7 @@ USER_AGENT = ( + r'|HttpClient|Jersey|Python|libwww-perl|Ruby|SynHttpClient|UniversalFeedParser|Googlebot|GoogleImageProxy' + r'|bingbot|Baiduspider|yacybot|YandexMobileBot|YandexBot|Yahoo! Slurp|MJ12bot|AhrefsBot|archive.org_bot|msnbot' + r'|MJ12bot|SeznamBot|linkdexbot|Netvibes|SMTBot|zgrab|James BOT|Sogou|Abonti|Pixray|Spinn3r|SemrushBot|Exabot' - + r'|ZmEu|BLEXBot|bitlybot' + + r'|ZmEu|BLEXBot|bitlybot|HeadlessChrome' # unmaintained Farside instances + r'|' + re.escape(r'Mozilla/5.0 (compatible; Farside/0.1.0; +https://farside.link)')