# Robots.txt file for domain: http://www.adoptapet-directory.com
#
# NOTE: robots.txt is parsed line by line. Every directive must sit on
# its own line; a directive that shares a line with a leading "#" is
# treated as part of the comment and ignored.

# These robots either waste resources, harvest emails, or
# do some other "bad" thing, but at least they obey the
# robots.txt file. They're not allowed here.
User-agent: almaden
User-agent: ASPSeek
User-agent: baiduspider
User-agent: dumbBot
User-agent: Generic
User-agent: grub-client
User-agent: MSIECrawler
User-agent: NexaBot
User-agent: NPBot
User-agent: OWR_Crawler
User-agent: psbot
User-agent: rabaz
User-agent: RPT-HTTPClient
User-agent: ScoutAbout
User-agent: semanticdiscovery
User-agent: TurnitinBot
User-agent: Wget
Disallow: /

# All other robots are allowed to spider the domain, but are
# requested not to spider the images and document directories.
# (Only "#" comment lines, never blank lines, are used inside this
# group, so that parsers which end a record at a blank line keep all
# of the rules below attached to "User-agent: *".)
User-agent: *
Disallow: /images/
Disallow: /maint/
Disallow: /cgi-bin/apf4/
#
# This is simply bait. If they go here, after being
# told not to, I simply won't be responsible for what happens.
#
Disallow: /users/
#
# Disallow the following directories to optimize page rank.
#
Disallow: /forum/admin/
Disallow: /forum/db/
Disallow: /forum/images/
Disallow: /forum/includes/
Disallow: /forum/language/
Disallow: /forum/templates/
Disallow: /forum/common.php
Disallow: /forum/config.php
Disallow: /forum/faq.php
Disallow: /forum/groupcp.php
Disallow: /forum/login.php
Disallow: /forum/memberlist.php
Disallow: /forum/modcp.php
Disallow: /forum/posting.php
Disallow: /forum/privmsg.php
Disallow: /forum/profile.php
Disallow: /forum/search.php
Disallow: /forum/viewonline.php