# robots.txt for http://www.vegetarian.web.id/
# Last updated 1999/03/27 by jd
#
# This file is line-oriented: each directive must sit on its own line, and a
# '#' turns the rest of that line into a comment. Do not insert blank lines
# inside the group below - some older parsers treat a blank line as the end
# of the record.
#
# Rules apply to all robots
User-agent: *
# Ask crawlers that honour Crawl-delay to wait between successive requests.
Crawl-delay: 10
#
# Cousin Directories - disallow the textfiles in the index directories
# 'cos they'll keep changing, but allow the indexes
# Disallow any files in /cousin beginning with istcclr - legacy
#
# Disabled rules, kept for reference:
# Disallow: /.htaccess
# Disallow: /guardian.cgi
# Disallow: /search-articles.cgi
# Disallow: /favicon.ico
# Disallow: /recipes/favicon.ico
#
# Excludes all root files and sub-directories to do with search
# NOTE(review): "Exclude" is not a field defined by the Robots Exclusion
# Protocol; crawlers are expected to ignore lines they do not recognise, so
# these two lines probably have no effect. Kept unchanged - confirm whether
# they can be removed or should become Disallow rules.
Exclude: CGI
Exclude: ico
#
# Don't want the images to be indexed do we?
Disallow: /cgi-bin/
Disallow: /image/afoto/
Disallow: /image/banner/
# NOTE(review): no trailing slash, so this matches every path that starts
# with /image/ttf - confirm that is intended.
Disallow: /image/ttf
#
# Error messages directory - principally the "Not Found" message
#Disallow: /errormsg/
#
# Stats directories - constantly changing
#Disallow: /logs/
#
# Need to tidy this up once search engine is back on-line
#Disallow: /search.temporarily.withdrawn.html
#
# Disallow the email directories
#Disallow: /emaildir/
#Disallow: /contactsdir/