# $Id: robots.txt,v 1.1.5.2 2009/02/28 18:57:07
#
# robots.txt for http://www.geekberry.net by Giancarlo Colfer
#
# This file is to prevent the crawling and indexing of certain parts
# of your site by web crawlers and spiders run by sites like Yahoo!
# and Google. By telling these "robots" where not to go on your site,
# you save bandwidth and server resources.
#
# This file will be ignored unless it is at the root of your host:
# Used:    http://example.com/robots.txt
# Ignored: http://example.com/site/robots.txt
#
# For more information about the robots.txt standard, see:
# http://www.robotstxt.org/wc/robots.html
#
# For syntax checking, see:
# http://www.sxw.org.uk/computing/robots/check.html
#
# Layout rules used in this file:
#   * One directive per line; a "#" starts a comment that runs to end of line.
#   * Each "User-agent" line opens a group; groups are separated by one blank
#     line and contain no blank lines themselves.
#   * Every rule path starts with "/". "*" matches any run of characters and
#     a trailing "$" anchors the rule to the end of the URL.

# Google Search Engine Robot
User-agent: Googlebot
# Directories
# Files
#Allow: /*?$
# Any URL that carries a query string.
Disallow: /*?
Disallow: /index.php
Disallow: /xmlrpc.php
Disallow: /wp-cron.php
Disallow: /*.php$
# NOTE(review): blocking .js/.css (and /wp-content/, /wp-includes/ below) may
# keep Google from rendering pages as visitors see them - confirm this is
# still wanted.
Disallow: /*.js$
Disallow: /*.inc$
Disallow: /*.css$
# Paths (clean URLs)
Disallow: /wp-admin/
Disallow: /wp-content/
Disallow: /wp-includes/
# /feed/ covers the site-level feed; /*/feed/ covers feeds nested under any
# other path (same pairing for trackbacks).
Disallow: /feed/
Disallow: /*/feed/
Disallow: /trackback/
Disallow: /*/trackback/
Disallow: /archives/
Disallow: /author/
Disallow: /page/
Disallow: /tag/
Disallow: /category/
Disallow: /store/

# Google AdSense crawler (token has no trailing wildcard)
User-agent: Mediapartners-Google
Disallow: /*?

# Yahoo! Search Engine Robot
User-agent: Slurp
Crawl-delay: 1
Disallow: /*?

# Microsoft Search Engine Robot
# NOTE(review): only the "msnbot" token is listed; any newer Microsoft crawler
# token would fall through to the "*" group - confirm that is intended.
User-agent: msnbot
Crawl-delay: 10
Disallow: /*?

# Alexa
User-agent: ia_archiver
Disallow: /*?

User-agent: duggmirror
Disallow: /*?

# Every bot that might possibly read and respect this file
User-agent: *
Crawl-delay: 20
# Directories
Disallow: /downloads/
# Files
#Allow: /*?$
Disallow: /*?
Disallow: /index.php
Disallow: /xmlrpc.php
Disallow: /wp-cron.php
Disallow: /*.php$
Disallow: /*.js$
Disallow: /*.inc$
Disallow: /*.css$
# Paths (clean URLs)
Disallow: /wp-admin/
Disallow: /wp-content/
Disallow: /wp-includes/
Disallow: /feed/
Disallow: /*/feed/
Disallow: /trackback/
Disallow: /*/trackback/
Disallow: /archives/
Disallow: /author/
Disallow: /page/
Disallow: /tag/
Disallow: /category/
Disallow: /store/
# Paths (no clean URLs)
#Disallow: /?q=admin/

# Sitemap location; this line is independent of the user-agent groups above.
Sitemap: http://www.geekberry.net/sitemap.xml