# $Id: robots.txt,v 1.9.2.1 2008/12/10 20:12:19 goba Exp $
#
# robots.txt
#
# This file prevents web crawlers and spiders, run by sites like Yahoo!
# and Google, from crawling and indexing certain parts of your site.
# By telling these "robots" where not to go on your site, you save
# bandwidth and server resources.
#
# For more information about the robots.txt standard, see:
# http://www.robotstxt.org/wc/robots.html
#
# For syntax checking, see:
# http://www.sxw.org.uk/computing/robots/check.html
#
# Formatting notes:
# - Each directive must sit on its own line; a "#" comments out the rest
#   of the line it appears on.
# - No blank lines are used inside a group, because some parsers treat a
#   blank line as the end of the group.

# Group 1: Yahoo! (Slurp) and Google (Googlebot) may crawl the site,
# except for the paths disallowed below.
User-agent: Slurp
User-agent: Googlebot
# NOTE(review): Google documents that Googlebot does not honor
# Crawl-delay, so this presumably only affects Slurp - confirm.
Crawl-delay: 5
# MAGENTO
Disallow: /404/
Disallow: /app/
Disallow: /downloader/
Disallow: /js/
Disallow: /lib/
Disallow: /media/
Disallow: /pkginfo/
Disallow: /report/
Disallow: /skin/
Disallow: /var/
Disallow: /cron.php
Disallow: /install.php
Disallow: /pear
# Directories (under /company/)
Disallow: /company/includes/
Disallow: /company/misc/
Disallow: /company/modules/
Disallow: /company/profiles/
Disallow: /company/scripts/
Disallow: /company/sites/
Disallow: /company/themes/
# Files (under /company/)
Disallow: /company/CHANGELOG.txt
Disallow: /company/cron.php
Disallow: /company/INSTALL.mysql.txt
Disallow: /company/INSTALL.pgsql.txt
Disallow: /company/install.php
Disallow: /company/INSTALL.txt
Disallow: /company/LICENSE.txt
Disallow: /company/MAINTAINERS.txt
Disallow: /company/update.php
Disallow: /company/UPGRADE.txt
Disallow: /company/xmlrpc.php
# Paths (clean URLs)
Disallow: /company/admin/
Disallow: /company/comment/reply/
Disallow: /company/logout/
Disallow: /company/node/add/
Disallow: /company/search/
Disallow: /company/user/register/
Disallow: /company/user/password/
Disallow: /company/user/login/
# Paths (no clean URLs)
Disallow: /company/?q=admin/
Disallow: /company/?q=comment/reply/
Disallow: /company/?q=contact/
Disallow: /company/?q=logout/
Disallow: /company/?q=node/add/
Disallow: /company/?q=search/
Disallow: /company/?q=user/password/
Disallow: /company/?q=user/register/
Disallow: /company/?q=user/login/

# Group 2: any crawler other than Yahoo!/Google must not crawl anything.
User-agent: *
Disallow: /