# $Id: robots.txt,v 1.18 2003/08/20 15:42:41 krusch Exp bolger $
#
# This file is retrieved by webwalkers (a.k.a. spiders, crawlers) that
# conform to the de facto Robots Exclusion standard.
# See: (reference URL missing from this copy of the file -- TODO restore)
#
# Comments to the webmaster should be posted at:
#   (contact address missing from this copy of the file -- TODO restore)
#
# Format is:
#   User-agent: <crawler name, or * for all crawlers>
#   Disallow: <empty, meaning nothing is disallowed> | <URL path prefix>
#
# Each record must be on its own line, and a "#" comments out everything
# up to the end of that line. Do not join records onto one line: any
# directive that follows a "#" on the same line is ignored by crawlers.
#
# Flag  Date      By      Reason
# $l1-  19950130  epc     finally understood what the file was for!
# $L2=  19960909  epc     fixed url since mak moved to Webcrawler...
# $L3=  19970811  epc     drop /Stretch
# $L4=  19991102  krusch  fixed User-agent capitalization and contact info
# $L5=  20010327  krusch  Updated disallow rules
# $L6=  20041015  kapil   Added rules to disallow results pages for task based navigation
# -----------------------------------------------------------------------------

# Default rules: apply to every crawler that has no more specific group below.
# Paths are case-sensitive prefixes, hence both /Admin and /admin, etc.
User-agent: *
Disallow: //
Disallow: /Admin
Disallow: /admin
Disallow: /zx
Disallow: /zz
Disallow: /common
Disallow: /cgi-bin
Disallow: /scripts
Disallow: /Scripts
Disallow: /i/
Disallow: /image
Disallow: /Search
Disallow: /search
Disallow: /link
Disallow: /perl
Disallow: /tmp
Disallow: /account/registration
Disallow: /webmaster
Disallow: /products/finder
Disallow: /products/learn/action

# Rules for the "Fast corporate crawler" user agent only.
# NOTE(review): a crawler that matches a named group follows that group
# instead of the "*" group, so /account/registration, /products/finder and
# /products/learn/action are NOT disallowed for this crawler. Confirm that
# this difference from the default rules is intentional.
User-agent: Fast corporate crawler
Disallow: //
Disallow: /Admin
Disallow: /admin
Disallow: /zx
Disallow: /zz
Disallow: /common
Disallow: /cgi-bin
Disallow: /scripts
Disallow: /Scripts
Disallow: /i/
Disallow: /image
Disallow: /Search
Disallow: /search
Disallow: /link
Disallow: /perl
Disallow: /tmp
Disallow: /webmaster