# robots.txt
#
# One group per crawler: a "User-agent:" line followed by the "Disallow:"
# path prefixes that crawler must not fetch. Every directive must sit on its
# own line; a "#" starts a comment that runs to the end of that line.
# Robots not named in a specific group fall through to the "*" group at the
# bottom of the file.

# Googlebot (web search)
User-agent: GOOGLEBOT
Disallow: /cgi-bin/
Disallow: /takethis/

# Googlebot Image: blocked from the whole site
User-agent: Googlebot-Image
Disallow: /

# Altavista
User-agent: Scooter
Disallow: /cgi-bin/
Disallow: /takethis/

User-agent: Altavista
Disallow: /cgi-bin/
Disallow: /takethis/

# http://fast.no/
User-agent: FAST
Disallow: /cgi-bin/
Disallow: /takethis/

# The Wayback Machine: http://www.archive.org/
User-agent: ia_archiver
Disallow: /

# From: Dansk Bibliotekscenter A/S
User-agent: Ankiro
Disallow: /

# Blocked from the whole site
User-agent: mia
Disallow: /

# Lycos
User-agent: T-Rex
Disallow: /cgi-bin/
Disallow: /takethis/

# We never saw this robot request /robots.txt at all, so just block it.
User-agent: sitecheck.internetseer.com
Disallow: /

# Zeus does not appear to respect /robots.txt or robots META tags.
User-agent: Zeus
Disallow: /

# Blocked from the whole site
User-agent: ZyBorg
Disallow: /

# Blocked from the whole site
User-agent: grub-client
Disallow: /

# Microsoft
User-agent: MSIECrawler
Disallow: /

# Microsoft
User-agent: msnbot
Disallow: /

## Disallowing Access - Specific robots
## NO access (e-collector, CMC/0.01, Google Image)
## (disabled example: remove the leading "#" on each line to activate)
#User-agent: ecollector
#User-agent: CMC/0.01
#User-agent: Googlebot-Image
#Disallow: /

## Spider from Example.invalid
## (disabled example: remove the leading "#" on each line to activate)
#User-agent: Example
#Disallow: /dir1/
#Disallow: /dir2/
#Disallow: /dir3/

# Default: applies to every robot that has no group of its own above.
# NOTE(review): "Disallow: /" already covers the entire site, so the two
# narrower rules after it are redundant. Confirm that a full block for all
# unlisted robots is intended; if not, delete the "Disallow: /" line.
User-agent: *
Disallow: /
Disallow: /cgi-bin/
Disallow: /takethis/