mirror of https://gitlab.com/bashrc2/epicyon
Extra LLM crawler
parent
a738e1316e
commit
0ec43c6323
|
@@ -135,7 +135,7 @@ def blocked_user_agent(calling_domain: str, agent_str: str,
|
||||||
'facebookbot', 'google-extended', 'piplbot', 'oai-search',
|
'facebookbot', 'google-extended', 'piplbot', 'oai-search',
|
||||||
'applebot-extended', 'meta-external', 'diffbot', 'perplexitybot',
|
'applebot-extended', 'meta-external', 'diffbot', 'perplexitybot',
|
||||||
'omgili', 'imagesiftbot', 'bytespider', 'amazonbot', 'youbot',
|
'omgili', 'imagesiftbot', 'bytespider', 'amazonbot', 'youbot',
|
||||||
'petalbot'
|
'petalbot', 'ai2bot', 'allenai'
|
||||||
)
|
)
|
||||||
for bot_str in llm_bot_strings:
|
for bot_str in llm_bot_strings:
|
||||||
if bot_str in agent_str_lower:
|
if bot_str in agent_str_lower:
|
||||||
|
|
Loading…
Reference in New Issue