block all spiders by default, allow major ones

This commit is contained in:
joshua stein 2013-06-25 13:56:31 -05:00
parent ed512cc065
commit b1e9e359a3

View file

@ -1,5 +1,16 @@
# no caching: keep the archive crawlers out.
# Both agents share one group with an explicit rule so they cannot be merged
# into a neighbouring group by accident.
User-agent: ia_archiver
User-agent: archive.org_bot
Disallow: /

# block all spiders by default
User-agent: *
Disallow: /

# but allow major ones
User-agent: Googlebot
Allow: /

User-agent: Slurp
Allow: /

# An empty Disallow value excludes nothing, i.e. the whole site is allowed.
User-agent: msnbot
Disallow:

# Explicitly blocked; same rule as the default group above.
User-agent: Baiduspider
Disallow: /