#
# robots.txt for http://www.w3.org/
#
# $Id: robots.txt,v 1.45 2006/06/05 01:11:19 ted Exp $
#
# Format notes:
#   - One directive per line; a '#' starts a comment that runs to end of line.
#   - Each group begins with one or more User-agent lines followed by its rules.
#   - Disallow values are matched as URL path prefixes.
#   - An empty Disallow value means nothing is disallowed for that group.
#

# For use by search.w3.org
User-agent: W3C-gsa
Disallow: /Out-Of-Date

# This robot is excluded from the entire site.
User-agent: Mozilla/4.0 (compatible; MSIE 6.0; Windows NT; MS Search 4.0 Robot)
Disallow: /

# W3C Link checker (empty Disallow: may fetch everything)
User-agent: W3C-checklink
Disallow:

# exclude some access-controlled areas
User-agent: *
Disallow: /artigos.php
# Prefix rule without the session id (osCsid), so the page is excluded
# regardless of which session parameter is appended to the URL.
Disallow: /password_forgotten.php
Disallow: /obras
Disallow: /noticias
#Disallow: /2005/06/blog/
#Disallow: /2001/07/pubrules-checker
# shouldn't get transparent proxies but will ml links of things like pubrules
Disallow: /2000/06/webdata/xslt
Disallow: /2000/09/webdata/xslt