More LLM crawlers

merge-requests/30/head
Bob Mottram 2024-10-05 17:16:21 +01:00
parent d4084f6e9e
commit f2bd491900
1 changed file with 2 additions and 2 deletions

View File

@@ -139,8 +139,8 @@ def blocked_user_agent(calling_domain: str, agent_str: str,
'petalbot', 'ai2bot', 'allenai', 'firecrawl', 'friendlycrawler',
'googleother', 'icc-crawler', 'scrapy', 'timpibot',
'velenpublic', 'webzio-extended', 'cohere-ai', 'facebookexternal',
-'img2dataset', 'isscyberriskcrawler', 'sidetrade', 'kangaroo',
-'iaskspider'
+'img2dataset', 'isscyberriskcrawler', 'sidetrade', 'kangaroo.ai',
+'kangaroo bot', 'iaskspider'
)
for bot_str in llm_bot_strings:
if bot_str in agent_str_lower: