# $Id: robots.txt,v 1.9.2.2 2010/09/06 10:37:16 goba Exp $
#
# robots.txt
#
# This file is to prevent the crawling and indexing of certain parts
# of your site by web crawlers and spiders run by sites like Yahoo!
# and Google. By telling these "robots" where not to go on your site,
# you save bandwidth and server resources.
#
# This file will be ignored unless it is at the root of your host:
# Used:    http://example.com/robots.txt
# Ignored: http://example.com/site/robots.txt
#
# For more information about the robots.txt standard, see:
# http://www.robotstxt.org/wc/robots.html
#
# For syntax checking, see:
# http://www.sxw.org.uk/computing/robots/check.html
#
# Formatting rules for maintainers:
#   - One directive per line. A "#" turns the rest of its line into a
#     comment, so a directive that shares a line with a comment is ignored.
#   - Do not insert blank lines between "User-agent" and the last rule
#     below; some parsers treat a blank line as the end of the group.
#     Use "#" comment lines as separators instead.
#   - "*" matches any run of characters and a trailing "$" anchors the
#     pattern to the end of the URL. Paths are case-sensitive, which is
#     why several rules are repeated with different capitalisation.

User-agent: *
Crawl-delay: 10
# Directories
Disallow: /includes/
Disallow: /misc/
Disallow: /modules/
Disallow: /profiles/
Disallow: /scripts/
Disallow: /sites/
Disallow: /themes/
# Files
Disallow: /CHANGELOG.txt
Disallow: /cron.php
Disallow: /INSTALL.mysql.txt
Disallow: /INSTALL.pgsql.txt
Disallow: /install.php
Disallow: /INSTALL.txt
Disallow: /LICENSE.txt
Disallow: /MAINTAINERS.txt
Disallow: /update.php
Disallow: /UPGRADE.txt
Disallow: /xmlrpc.php
# Paths (clean URLs)
Disallow: /admin/
Disallow: /comment/reply/
Disallow: /contact/
Disallow: /logout/
Disallow: /node/add/
Disallow: /node/edit/
Disallow: /search/
Disallow: /user/register/
Disallow: /user/password/
Disallow: /user/login/
# Paths (no clean URLs)
Disallow: /?q=admin/
Disallow: /?q=comment/reply/
Disallow: /?q=contact/
Disallow: /?q=logout/
Disallow: /?q=node/add/
Disallow: /?q=node/edit/
Disallow: /?q=search/
Disallow: /?q=user/password/
Disallow: /?q=user/register/
Disallow: /?q=user/login/
#
# Site-specific rules
#
# stop the bleeding on these patterns that now correctly return 404
# google stop crawling these!
#
# NOTE(review): many patterns below start with "*" rather than "/".
# RFC 9309 defines a path pattern as starting with "/"; crawlers that
# follow it strictly may skip these rules. They are kept as written
# because prefixing "/" would change what they match - confirm against
# the crawlers you care about before rewriting them.
Disallow: */.../
Disallow: *..?page=
Disallow: */page/*?page=
Disallow: */www.*.
Disallow: */user/password$
Disallow: */user/password?page=
Disallow: */help$
Disallow: */help?page=
Disallow: *2009/*/2009/
Disallow: *2010/*/2010/
Disallow: *r:t$
Disallow: *r:t?page=
Disallow: *@*
Disallow: /www/
# Two-digit .aspx pages, 01 through 12
Disallow: */01.aspx
Disallow: */02.aspx
Disallow: */03.aspx
Disallow: */04.aspx
Disallow: */05.aspx
Disallow: */06.aspx
Disallow: */07.aspx
Disallow: */08.aspx
Disallow: */09.aspx
Disallow: */10.aspx
Disallow: */11.aspx
Disallow: */12.aspx
# Any path segment starting with a digit followed directly by "?page"
Disallow: */0?page
Disallow: */1?page
Disallow: */2?page
Disallow: */3?page
Disallow: */4?page
Disallow: */5?page
Disallow: */6?page
Disallow: */7?page
Disallow: */8?page
Disallow: */9?page
Disallow: */comment-page-
Disallow: */scanner/https://
Disallow: */rss.aspx
Disallow: *.aspx?utm_source=feedburner
Disallow: /CS/controlpanel/
Disallow: /cs/controlpanel/
Disallow: /CS/user/
Disallow: /PickUPedia/
# Category and tag listings
Disallow: /category/archived-categories
Disallow: /category/archived-tags
Disallow: /category/advice-categories
Disallow: /category/advice-tag
Disallow: /category/extrafeatures-categories
Disallow: /category/extrafeatures-tags
Disallow: /category/photofeatures-categories
Disallow: /category/scanner-categories
Disallow: /category/scanner-tag
Disallow: /scanner/tag/
Disallow: /scanner/category/
Disallow: /cs/blogs/*/archive/tags/
Disallow: /CS/blogs/*/archive/tags/
Disallow: /advice/tag/
Disallow: /entertainment/category/
Disallow: /toolsofattraction/tag/
Disallow: *ConfessionalEntry.aspx
Disallow: */moreTwis.asp
# Contributors pages, every capitalisation in use
Disallow: /aboutUs/contributors/
Disallow: /aboutUs/Contributors/
Disallow: /aboutus/contributors/
Disallow: /aboutus/Contributors/
Disallow: *Response.asp?auth=
Disallow: /giveandtake/
Disallow: /pickupedia/
Disallow: /rg/
Disallow: /scanner/feed?page
Disallow: /scanner/2010?page
Disallow: /scanner/page/
Disallow: /scanner/wp-admin/
Disallow: /scanner/wp-content/
Disallow: /toolsofattraction/feed/
Disallow: /scanner/2009/*?page=
Disallow: /scanner/2010/*?page=
Disallow: */printcopy.asp
Disallow: /cs/search/
# Any URL whose path begins with a double slash
Disallow: //