[chore] Update robots.txt with more AI scrapers (#3248)

This commit is contained in:
Daenney 2024-08-29 17:42:48 +02:00 committed by GitHub
parent 1f3dfbf10c
commit 277b043633
No known key found for this signature in database
GPG key ID: B5690EEEBB952194

View file

@@ -31,6 +31,8 @@ const (
 # AI scrapers and the like.
 # https://github.com/ai-robots-txt/ai.robots.txt/
+User-agent: AI2Bot
+User-agent: Ai2Bot-Dolma
 User-agent: AdsBot-Google
 User-agent: Amazonbot
 User-agent: anthropic-ai
@@ -50,9 +52,11 @@ User-agent: GoogleOther
 User-agent: GoogleOther-Image
 User-agent: GoogleOther-Video
 User-agent: GPTBot
+User-agent: ICC-Crawler
 User-agent: ImagesiftBot
 User-agent: img2dataset
 User-agent: Meta-ExternalAgent
+User-agent: Meta-ExternalFetcher
 User-agent: OAI-SearchBot
 User-agent: omgili
 User-agent: omgilibot
@@ -61,6 +65,7 @@ User-agent: PetalBot
 User-agent: Scrapy
 User-agent: Timpibot
 User-agent: VelenPublicWebCrawler
+User-agent: Webzio-Extended
 User-agent: YouBot
 Disallow: /