# robots.txt - asks bots, spiders, crawlers, search engines etc. not to fetch
# certain directories or files.
# First created 21/02/2008 by A.N.
#
# Format notes:
#   - One record per line; a '#' starts a comment that runs to end of line,
#     so every directive must sit on its own line to take effect.
#   - Path values are matched case-sensitively, which is why both
#     /pagenotfound.html and /PageNotFound.html are listed.
#   - No blank lines are used inside the group below, because some older
#     parsers treat a blank line as the end of a record.
#
# The rules below apply to every crawler.
User-Agent: *
Disallow: /pagenotfound.html
Disallow: /hrdl01/
Disallow: /viren001/
Disallow: /x-Event-Archive/
Disallow: /x-News-Archive/
Disallow: /test/
Disallow: /test1/
Disallow: /test2/
Disallow: /test3/
Disallow: /test4/
# Higher-level folders that crawlers should never reach anyway.
Disallow: /httpsdocs/
Disallow: /private/
Disallow: /anon_ftp/
Disallow: /subdomains/
# Pages containing email addresses - an attempt to reduce address harvesting.
# NOTE(review): this only affects crawlers that honour robots.txt.
Disallow: /DealInqu1.html
Disallow: /EmplInqu1.html
Disallow: /PressInqu2.html
Disallow: /Contact-Us1.html
Disallow: /SaleInqu1.html
Disallow: /InveInqu1.html
Disallow: /PageNotFound.html
Disallow: /hi-resDL1.html