# robots.txt for http://www.ithaca.edu/
#
# The Robots Exclusion Protocol is line-oriented: each directive must sit on
# its own line, and a "#" starts a comment that runs to the end of that line.
# Keep one rule per line, otherwise everything after the first "#" is ignored.

User-agent: *                                           # All spiders should avoid
Disallow: /cgi-bin/                                     # Script files
Disallow: /computing/cgi-bin/                           # Script files
Disallow: /its/cgi-bin/                                 # Script files
Disallow: /work/                                        # The test area for web experimentation
Disallow: /webdev/                                      # The test area for web experimentation
Disallow: /itswebdev/                                   # The test area for web experimentation
Disallow: /web_admin/Stats/                             # Huge server statistic logs
Disallow: /web_admin/MOMspider/                         # MOMspider output
Disallow: /courses/                                     # Exclude student course directories
Disallow: /computing/seniorstaff/secure                 # Exclude ACCS secure area
Disallow: /students/chintze1/                           # Reallow when she is back from Spain
Disallow: /noaccess                                     # No access space
Disallow: /stats/
Disallow: /hs/depts/chemistry/facstaff/eonah/           # Despite 404, still appears in results
Disallow: /intercom/article.php/20100411200124486       # Intercom redirects instead of 404'ing