# $Id: robots.txt,v 1.9 2007/06/27 22:37:44 goba Exp $
#
# robots.txt
#
# This file is to prevent the crawling and indexing of certain parts
# of your site by web crawlers and spiders run by sites like Yahoo!
# and Google. By telling these "robots" where not to go on your site,
# you save bandwidth and server resources.
#
# This file will be ignored unless it is at the root of your host:
# Used:    http://example.com/robots.txt
# Ignored: http://example.com/site/robots.txt
#
# For more information about the robots.txt standard, see:
# http://www.robotstxt.org/wc/robots.html
#
# For syntax checking, see:
# http://www.sxw.org.uk/computing/robots/check.html
#
# Formatting note: every directive must be on its own line, and a "#"
# comments out the rest of its line. Do not insert blank lines inside the
# rule group below; some parsers treat a blank line as the end of the group.

User-agent: *
# Directories
Disallow: /userlist/content
Disallow: /userlist/content/
Disallow: /s/
Disallow: /*/book/*
Disallow: /*/book*
Disallow: /*/book
Disallow: /*/export*
Disallow: /*/export/*
Disallow: /database/
Disallow: /includes/
Disallow: /misc/
Disallow: /modules/
Disallow: /sites/
Disallow: /themes/
Disallow: /scripts/
Disallow: /updates/
Disallow: /profiles/
Disallow: /profile
Disallow: /profile/
# Files
Disallow: /xmlrpc.php
Disallow: /cron.php
Disallow: /update.php
Disallow: /install.php
Disallow: /INSTALL.txt
Disallow: /INSTALL.mysql.txt
Disallow: /INSTALL.pgsql.txt
Disallow: /CHANGELOG.txt
Disallow: /MAINTAINERS.txt
Disallow: /LICENSE.txt
Disallow: /UPGRADE.txt
# Paths (clean URLs)
Disallow: /admin/
Disallow: /comment/reply/
#Disallow: /contact
Disallow: /logout/
Disallow: /node/add/
Disallow: /search/
Disallow: /user/register/
Disallow: /user/password/
Disallow: /user/password
Disallow: /user/login/
Disallow: /user/
# Paths (no clean URLs)
Disallow: /?q=es/
Disallow: /?q=es
Disallow: /?q
Disallow: /?q=admin/
Disallow: /?q=comment/reply/
Disallow: /?q=contact/
Disallow: /?q=logout/
Disallow: /?q=node/add/
Disallow: /?q=search/
Disallow: /?q=user/password/
Disallow: /?q=user/
Disallow: /?q=user/register/
Disallow: /?q=user/login/
# Additional paths (clean URLs), with and without a trailing slash
#Disallow: /user
Disallow: /admin
Disallow: /node/add
Disallow: /aggregator/
Disallow: /aggregator
Disallow: /comment/
Disallow: /comment
#Disallow: /contact
#Disallow: /contact/
Disallow: /logout
Disallow: /search
Disallow: /tribune
Disallow: /tribune/
Disallow: /calendar
Disallow: /calendar/
Disallow: /Calendar
Disallow: /Calendar/
#Disallow: /tracker
#Disallow: /tracker/
#Disallow: /*/track/
#Disallow: /tracker?
#Disallow: /*/feed$
#Disallow: /*/feed*
#Disallow: /*/feed/
#Disallow: /blog/
#Disallow: /*/track$
Disallow: /*/subscribe
Disallow: /*/subscribe/
Disallow: /*/subscribe*
# Views and Forum module problem:
Disallow: /*sort=
# Image module problem
Disallow: /*size=
# This avoids the creation of a duplicate home-page.
# The URL http://example.com/node is a duplicate of http://example.com/.
Disallow: /node$
Disallow: /print/
Disallow: /es
Disallow: /es/
#Disallow: /category
#Disallow: /category/
Disallow: /messages
Disallow: /messages/
Disallow: /taxonomy
Disallow: /taxonomy/
Disallow: /taxonomy_vtn
Disallow: /taxonomy_vtn/
Disallow: /*/guestbook
#Disallow: /node
#Disallow: /node/
# This disallows the numerical forum urls (can still access at
# /forums/nicaragua etc).
#Disallow: /forum/
Disallow: /image_captcha
Disallow: /image_captcha/
#Disallow: /?
#Disallow: /?page=*
#Disallow: /?page=
#Disallow: /?page=1
#Disallow: /?page=2
#Disallow: /?page=4
#Disallow: /?page=3
#Disallow: /?page=5
#Disallow: /?page=6
#Disallow: /?page=7
#Disallow: /?page=8
#Disallow: /?page=9
#Disallow: /?page=10
#Disallow: /?page=11
#Disallow: /?page=12
#Disallow: /?page=13
#Disallow: /?page=14
#Disallow: /?page=15
#Disallow: /?page=16
#Disallow: /?page=17
#Disallow: /popular
#Disallow: /popular/
#Disallow: /node/
#Disallow: /search
#Disallow: /piwik
#Disallow: /piwik.php
#Disallow: /piwik/
#Disallow: /search$
#Disallow: /*?page=0,0$
#Disallow: /*?page=0,1000$
#Disallow: /central-america-latest-blogs
#Disallow: /central-america-news
#Disallow: /central-america-latest-blogs?page=*
#Disallow: /central-america-news?page=*
# Explicit allows. Crawlers that apply the longest-matching rule let
# "Allow: /sites/*/files/" override "Disallow: /sites/" above; crawlers that
# apply the first matching rule will still honor the earlier Disallow lines.
Allow: /
Allow: /sites/*/files/
Allow: /*peter-blog*