mirror of
https://github.com/ai-robots-txt/ai.robots.txt.git
synced 2025-04-05 19:37:45 +00:00
Merge branch 'main' into feature/add-table-of-crawler-detail
This commit is contained in:
commit
db06035714
3 changed files with 9 additions and 0 deletions
4
apache.conf.txt
Normal file
4
apache.conf.txt
Normal file
|
@ -0,0 +1,4 @@
|
||||||
|
# For apache2.conf or .htaccess (requires mod_rewrite): blocks the listed crawlers by matching their User-Agent string.
|
||||||
|
RewriteEngine On
|
||||||
|
# Match any request whose User-Agent contains one of these crawler tokens; [NC] makes the match case-insensitive.
# The dot in "peer39_crawler/1.0" is escaped so it is treated as a literal character, not a regex wildcard.
RewriteCond %{HTTP_USER_AGENT} (AdsBot-Google|Amazonbot|anthropic-ai|Applebot|AwarioRssBot|AwarioSmartBot|Bytespider|CCBot|ChatGPT-User|ClaudeBot|Claude-Web|cohere-ai|DataForSeoBot|FacebookBot|FriendlyCrawler|Google-Extended|GoogleOther|GPTBot|ImagesiftBot|magpie-crawler|Meltwater|omgili|omgilibot|peer39_crawler|peer39_crawler/1\.0|PerplexityBot|PiplBot|Seekr|YouBot) [NC]
|
||||||
|
# Refuse every matching request with 403 Forbidden: "^" matches any URL path, "-" leaves it unrewritten, and [F] already implies [L].
RewriteRule ^ - [F]
|
4
nginx.conf.txt
Normal file
4
nginx.conf.txt
Normal file
|
@ -0,0 +1,4 @@
|
||||||
|
# For nginx.conf (place inside a server or location block): returns 403 to the listed crawlers by matching their User-Agent string.
|
||||||
|
# Case-insensitive (~*) match of the User-Agent header against the crawler tokens.
# The dot in "peer39_crawler/1.0" is escaped so it is treated as a literal character, not a regex wildcard.
if ($http_user_agent ~* (AdsBot-Google|Amazonbot|anthropic-ai|Applebot|AwarioRssBot|AwarioSmartBot|Bytespider|CCBot|ChatGPT-User|ClaudeBot|Claude-Web|cohere-ai|DataForSeoBot|FacebookBot|FriendlyCrawler|Google-Extended|GoogleOther|GPTBot|ImagesiftBot|magpie-crawler|Meltwater|omgili|omgilibot|peer39_crawler|peer39_crawler/1\.0|PerplexityBot|PiplBot|Seekr|YouBot)) {
|
||||||
|
return 403;
|
||||||
|
}
|
|
@ -12,6 +12,7 @@ User-agent: Claude-Web
|
||||||
User-agent: cohere-ai
|
User-agent: cohere-ai
|
||||||
User-agent: DataForSeoBot
|
User-agent: DataForSeoBot
|
||||||
User-agent: FacebookBot
|
User-agent: FacebookBot
|
||||||
|
User-agent: FriendlyCrawler
|
||||||
User-agent: Google-Extended
|
User-agent: Google-Extended
|
||||||
User-agent: GoogleOther
|
User-agent: GoogleOther
|
||||||
User-agent: GPTBot
|
User-agent: GPTBot
|
||||||
|
|
Loading…
Reference in a new issue