parent
7567dd74f3
commit
2d64cef6e0
3 changed files with 78 additions and 0 deletions
56
source/ai.robots.txt /robots.txt
Normal file
56
source/ai.robots.txt /robots.txt
Normal file
|
@@ -0,0 +1,56 @@
|
||||||
|
User-agent: AI2Bot
|
||||||
|
User-agent: Ai2Bot-Dolma
|
||||||
|
User-agent: aiHitBot
|
||||||
|
User-agent: Amazonbot
|
||||||
|
User-agent: anthropic-ai
|
||||||
|
User-agent: Applebot
|
||||||
|
User-agent: Applebot-Extended
|
||||||
|
User-agent: Brightbot 1.0
|
||||||
|
User-agent: Bytespider
|
||||||
|
User-agent: CCBot
|
||||||
|
User-agent: ChatGPT-User
|
||||||
|
User-agent: Claude-Web
|
||||||
|
User-agent: ClaudeBot
|
||||||
|
User-agent: cohere-ai
|
||||||
|
User-agent: cohere-training-data-crawler
|
||||||
|
User-agent: Cotoyogi
|
||||||
|
User-agent: Crawlspace
|
||||||
|
User-agent: Diffbot
|
||||||
|
User-agent: DuckAssistBot
|
||||||
|
User-agent: FacebookBot
|
||||||
|
User-agent: Factset_spyderbot
|
||||||
|
User-agent: FirecrawlAgent
|
||||||
|
User-agent: FriendlyCrawler
|
||||||
|
User-agent: Google-Extended
|
||||||
|
User-agent: GoogleOther
|
||||||
|
User-agent: GoogleOther-Image
|
||||||
|
User-agent: GoogleOther-Video
|
||||||
|
User-agent: GPTBot
|
||||||
|
User-agent: iaskspider/2.0
|
||||||
|
User-agent: ICC-Crawler
|
||||||
|
User-agent: ImagesiftBot
|
||||||
|
User-agent: img2dataset
|
||||||
|
User-agent: imgproxy
|
||||||
|
User-agent: ISSCyberRiskCrawler
|
||||||
|
User-agent: Kangaroo Bot
|
||||||
|
User-agent: meta-externalagent
|
||||||
|
User-agent: meta-externalfetcher
|
||||||
|
User-agent: NovaAct
|
||||||
|
User-agent: OAI-SearchBot
|
||||||
|
User-agent: omgili
|
||||||
|
User-agent: omgilibot
|
||||||
|
User-agent: Operator
|
||||||
|
User-agent: PanguBot
|
||||||
|
User-agent: Perplexity-User
|
||||||
|
User-agent: PerplexityBot
|
||||||
|
User-agent: PetalBot
|
||||||
|
User-agent: Scrapy
|
||||||
|
User-agent: SemrushBot-OCOB
|
||||||
|
User-agent: SemrushBot-SWA
|
||||||
|
User-agent: Sidetrade indexer bot
|
||||||
|
User-agent: TikTokSpider
|
||||||
|
User-agent: Timpibot
|
||||||
|
User-agent: VelenPublicWebCrawler
|
||||||
|
User-agent: Webzio-Extended
|
||||||
|
User-agent: YouBot
|
||||||
|
Disallow: /
|
22
source/sekretaerbaer.de/Liste-sekretaerbaer.txt
Normal file
22
source/sekretaerbaer.de/Liste-sekretaerbaer.txt
Normal file
|
@@ -0,0 +1,22 @@
|
||||||
|
AhrefsBot
|
||||||
|
Baiduspider
|
||||||
|
Barkrowler
|
||||||
|
Bingbot
|
||||||
|
BLEXBot
|
||||||
|
Bytedance
|
||||||
|
DotBot
|
||||||
|
EmailCollector
|
||||||
|
facebookcatalog
|
||||||
|
facebookexternalhit
|
||||||
|
fidget-spinner-bot
|
||||||
|
Franck the Fediverse Graph Crawler
|
||||||
|
Googlebot
|
||||||
|
Livelapbot
|
||||||
|
Mediapartners-Google
|
||||||
|
MJ12bot
|
||||||
|
SemrushBot
|
||||||
|
SeznamBot
|
||||||
|
VelenPublicWebCrawler
|
||||||
|
WebEMailExtrac
|
||||||
|
YandexBot
|
||||||
|
YisouSpider
|
Loading…
Add table
Add a link
Reference in a new issue