# Robots.txt for http://www.ippl-uk.org
#
# Format notes: one directive per line; "#" starts a comment that runs to the
# end of the line; groups are separated by blank lines. Do not join lines -
# anything following a "#" on the same line is ignored by crawlers.

# Disallow Internet Archive's crawler (and remove documents from the Wayback Machine)
# to prevent spam-harvesting of old pages with plain-text email addresses.
User-agent: ia_archiver
Disallow: /

# Disallow image bots
User-agent: Googlebot-Image
User-agent: psbot            # picsearch.com
User-agent: Yahoo-MMCrawler
User-agent: Teoma            # ask.com
Disallow: /images/
Disallow: /thumbs/
Disallow: /catalog/
Disallow: /common/

# All other robots may spider the domain except for specified files & directories
User-agent: *
Disallow: /common/               # navigation, etc. gifs
Disallow: /logs/                 # site information - of no relevance to searches
Disallow: /enquiry_response.htm  # form post-submission page - of no relevance to searches
Disallow: /css/                  # style sheets - of no relevance to searches
Disallow: /jscript/              # script - of no relevance to searches
Disallow: /dev/                  # future development
Disallow: /flycounter/           # hit counter files