# $Id: robots.txt,v 1.9.2.1 2008/12/10 20:12:19 goba Exp $
#
# robots.txt
#
# This file is to prevent the crawling and indexing of certain parts
# of your site by web crawlers and spiders run by sites like Yahoo!
# and Google. By telling these "robots" where not to go on your site,
# you save bandwidth and server resources.
#
# This file will be ignored unless it is at the root of your host:
# Used:    http://example.com/robots.txt
# Ignored: http://example.com/site/robots.txt
#
# For more information about the robots.txt standard, see:
# http://www.robotstxt.org/wc/robots.html
#
# For syntax checking, see:
# http://www.sxw.org.uk/computing/robots/check.html
#
# Formatting notes for maintainers:
# - One directive per line. A "#" starts a comment that runs to the end
#   of the line, so directives must never share a line with this header.
# - Groups (a User-agent line plus its rules) are separated by a blank
#   line. Do not put blank lines inside a group: some parsers treat a
#   blank line as the end of the group.
# - Rule order inside a group is kept stable because some crawlers apply
#   the first matching rule rather than the most specific one.

# Default policy for every crawler that has no more specific group below.
User-agent: *
# Crawl-delay is a non-standard extension; crawlers that do not support
# it simply ignore the line.
Crawl-delay: 10
# Directories
Disallow: /_css/
Disallow: /_img/
Disallow: /_notes/
# Spaces in a path must be percent-encoded; a raw space can make a parser
# truncate the rule to "/CNS".
Disallow: /CNS%20Video%20Tour/
Disallow: /CNS-Draft1/
Disallow: /CNS-Draft2/
Disallow: /CNS-Draft3/
Disallow: /Drupal_old_includes/
Disallow: /Drupal_old_misc/
Disallow: /Drupal_old_modules/
Disallow: /Drupal_old_profiles/
Disallow: /Drupal_old_root/
Disallow: /Drupal_old_scripts/
Disallow: /Drupal_old_sites/
Disallow: /Drupal_old_themes/
Disallow: /dwnload/
Disallow: /exchange/
Disallow: /files/
Disallow: /host/
Disallow: /hoverbox/
Disallow: /pm/
Disallow: /temp-rey/
Disallow: /wp_old/
# Any URL containing a query string.
Disallow: /*?*
Disallow: /iframes/
Disallow: /recommends/
# Files ("$" anchors the pattern to the end of the URL)
Disallow: /*.php$
Disallow: /*.js$
Disallow: /*.inc$
Disallow: /*.css$
Disallow: /*.gz$
Disallow: /*.wmv$
Disallow: /*.cgi$
Disallow: /*.xhtml$

# Google AdSense crawler: query-string URLs stay blocked, but the content
# sections and file types listed below are explicitly allowed.
# The user-agent token is written without a trailing "*"; only the bare
# "*" token is a wildcard on a User-agent line.
User-agent: Mediapartners-Google
Disallow: /*?*
Allow: /z/
Allow: /about/
Allow: /contact/
Allow: /wp-content/
Allow: /tag/
Allow: /manual/*
Allow: /docs/*
Allow: /*.php$
Allow: /*.js$
Allow: /*.inc$
Allow: /*.css$
Allow: /*.gz$
Allow: /*.cgi$
Allow: /*.wmv$
Allow: /*.xhtml$
Allow: /*.php*
Allow: /*.gif$
Allow: /*.jpg$
Allow: /*.png$

# disallow archiving site
User-agent: ia_archiver
Disallow: /

# disable duggmirror
User-agent: duggmirror
Disallow: /