# robots.txt
#
# Policy:
#   - The crawlers listed by name below may fetch the site except for
#     /cgi-bin/, /see/ and every path that starts with /da or /en.
#   - Some crawlers are blocked completely (Disallow: /).
#   - Every crawler that is not listed is blocked by the final "*" record.
#
# Format notes:
#   - One directive per line; records are separated by a blank line.
#   - Disallow values are path prefixes: "/da" also matches e.g. "/data".
#     NOTE(review): if only the language directories are meant, "/da/" and
#     "/en/" would be narrower - confirm before changing.

# Googlebot
User-agent: GOOGLEBOT
Disallow: /cgi-bin/
Disallow: /see/
Disallow: /da
Disallow: /en

# Googlebot Image
User-agent: Googlebot-Image
Disallow: /

# AltaVista
User-agent: Scooter
Disallow: /cgi-bin/
Disallow: /see/
Disallow: /da
Disallow: /en

User-agent: Altavista
Disallow: /cgi-bin/
Disallow: /see/
Disallow: /da
Disallow: /en

# FAST: http://fast.no/
User-agent: FAST
Disallow: /cgi-bin/
Disallow: /see/
Disallow: /da
Disallow: /en

# Wget
User-agent: Wget
Disallow: /cgi-bin/
Disallow: /see/
Disallow: /da
Disallow: /en

# The Wayback Machine: http://www.archive.org/
User-agent: ia_archiver
Disallow: /

# Collecting bot from Dansk Bibliotekscenter A/S
User-agent: Ankiro
Disallow: /

User-agent: mia
Disallow: /

# Lycos
User-agent: T-Rex
Disallow: /cgi-bin/
Disallow: /see/
Disallow: /da
Disallow: /en

# Sitecheck bot - do we want it to fetch HEAD info?
# We never saw it request /robots.txt at all, so just block it.
User-agent: sitecheck.internetseer.com
Disallow: /

# Zeus does not appear to respect /robots.txt or META tags,
# so just block the robot.
# NOTE(review): a rule here only helps if the bot starts honoring
# robots.txt; otherwise it has to be blocked at the server - confirm.
User-agent: Zeus
Disallow: /

User-agent: ZyBorg
Disallow: /

User-agent: grub-client
Disallow: /

User-agent: MSIECrawler
Disallow: /

## Spider from Example.invalid (disabled)
#User-agent: Example
#Disallow: /dir1/
#Disallow: /dir2/
#Disallow: /dir3/

# Default - finally, block all other robots
User-agent: *
Disallow: /