parent
7567dd74f3
commit
2d64cef6e0
3 changed files with 78 additions and 0 deletions
76
Bots and Crawler.txt
Normal file
76
Bots and Crawler.txt
Normal file
|
@ -0,0 +1,76 @@
|
|||
BLEXBot
|
||||
Barkrowler
|
||||
Livelapbot
|
||||
Franck, the Fediverse Graph Crawler
|
||||
YisouSpider
|
||||
DotBot
|
||||
VelenPublicWebCrawler
|
||||
ChatGPT-User
|
||||
GoogleOther
|
||||
GoogleOther-Image
|
||||
GoogleOther-Video
|
||||
Applebot
|
||||
Applebot-Extended
|
||||
AhrefsBot
|
||||
Baiduspider
|
||||
SemrushBot
|
||||
DotBot
|
||||
MJ12bot
|
||||
PetalBot
|
||||
SeznamBot
|
||||
Mediapartners-Google
|
||||
Bytespider
|
||||
Claude-Web
|
||||
GPTBot
|
||||
PerplexityBot
|
||||
Applebot
|
||||
Amazonbot
|
||||
Meta-ExternalAgent
|
||||
Meta-ExternalFetcher
|
||||
FacebookBot
|
||||
DuckAssistBot
|
||||
Anthropic-ai
|
||||
Bytedance
|
||||
fidget-spinner-bot
|
||||
EmailCollector
|
||||
WebEMailExtrac
|
||||
ClaudeBot
|
||||
facebookexternalhit
|
||||
facebookcatalog
|
||||
YandexBot
|
||||
Bingbot
|
||||
Googlebot
|
||||
AI2Bot
|
||||
Ai2Bot-Dolma
|
||||
Brightbot
|
||||
CCBot
|
||||
ChatGPT-User
|
||||
cohere-ai
|
||||
cohere-training-data-crawler
|
||||
Crawlspace
|
||||
Diffbot
|
||||
FriendlyCrawler
|
||||
Google-Extended
|
||||
GoogleOther
|
||||
GoogleOther-Image
|
||||
GoogleOther-Video
|
||||
iaskspider
|
||||
ICC-Crawler
|
||||
ImagesiftBot
|
||||
img2dataset
|
||||
ISSCyberRiskCrawler
|
||||
KangarooBot
|
||||
OAI-SearchBot
|
||||
omgili
|
||||
omgilibot
|
||||
PanguBot
|
||||
Perplexity-User
|
||||
PetalBot
|
||||
Scrapy
|
||||
SemrushBot-OCOB
|
||||
SemrushBot-SWA
|
||||
Sidetradeindexerbot
|
||||
Timpibot
|
||||
VelenPublicWebCrawler
|
||||
Webzio-Extended
|
||||
YouBot
|
Loading…
Add table
Add a link
Reference in a new issue