From 3d2c9e8361c1701ee2a87a55ba3c323ed9ad57c7 Mon Sep 17 00:00:00 2001 From: Dr Kim Foale Date: Tue, 20 Aug 2024 23:19:25 +0100 Subject: [PATCH] feat: Add robots.txt to ask AI bots not to crawl the site (#2569) --- config/robots/robots.production.txt | 35 +++++++++++++++++++++++++++++ 1 file changed, 35 insertions(+) diff --git a/config/robots/robots.production.txt b/config/robots/robots.production.txt index 726a20754..79b383864 100644 --- a/config/robots/robots.production.txt +++ b/config/robots/robots.production.txt @@ -6,3 +6,38 @@ User-agent: * Disallow: /assets/ + +User-agent: Amazonbot +User-agent: Applebot +User-agent: Applebot-Extended +User-agent: Bytespider +User-agent: CCBot +User-agent: ChatGPT-User +User-agent: Claude-Web +User-agent: ClaudeBot +User-agent: Diffbot +User-agent: FacebookBot +User-agent: FriendlyCrawler +User-agent: GPTBot +User-agent: Google-Extended +User-agent: GoogleOther +User-agent: GoogleOther-Image +User-agent: GoogleOther-Video +User-agent: ICC-Crawler +User-agent: ImagesiftBot +User-agent: Meta-ExternalAgent +User-agent: Meta-ExternalFetcher +User-agent: OAI-SearchBot +User-agent: PerplexityBot +User-agent: PetalBot +User-agent: Scrapy +User-agent: Timpibot +User-agent: VelenPublicWebCrawler +User-agent: YouBot +User-agent: anthropic-ai +User-agent: cohere-ai +User-agent: facebookexternalhit +User-agent: img2dataset +User-agent: omgili +User-agent: omgilibot +Disallow: / \ No newline at end of file