Add more spiders which do not seem to honour robots.txt #2135
1 changed file with 5 additions and 0 deletions
|
@@ -51,6 +51,11 @@ Alias /robots.txt /var/www/robots.txt
|
|||
RewriteEngine on
|
||||
RewriteRule ^/$ /nagios/ [R]
|
||||
|
||||
# Spiders-gone-wild
|
||||
# These spiders may not follow robots.txt and will
|
||||
# hit admin sections which consume large amounts of CPU
|
||||
# Case-insensitive ([NC]) substring match on the User-Agent header; the
# pattern is unanchored, so no leading/trailing ".*" is needed.
RewriteCond %{HTTP_USER_AGENT} (Bytespider|ClaudeBot|Amazonbot|YandexBot|ChatGLM-Spider|GPTBot|Barkrowler|YisouSpider|MJ12bot) [NC]
|
||||
# Answer any request that met the condition above with 403 Forbidden.
# "^" matches every URL without scanning it; [F] already implies [L].
RewriteRule ^ - [F]
|
||||
|
||||
Alias /nagios /usr/share/nagios/html/
|
||||
<Directory "/usr/share/nagios/html">
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue