petersvegrup
12/8/2015 - 12:54 PM

Magento robots.txt

robots.txt template

# eValent 2015-2
#
# robots.txt
#
# This file tells web crawlers and spiders, such as those run by Yahoo!
# and Google, which parts of your site they should not crawl. By telling
# these "robots" where not to go on your site, you save bandwidth and
# server resources.
#
# For more information about the robots.txt standard, see:
# http://www.robotstxt.org/wc/robots.html
#
# For syntax checking, see:
# http://www.sxw.org.uk/computing/robots/check.html


## GENERAL SETTINGS

## Enable robots.txt rules for all crawlers
## ("*" addresses every user agent; the Allow/Disallow rules further down
## in this file belong to this group).
User-agent: *
## Ask crawlers to pause 10 seconds between requests.
## NOTE(review): Crawl-delay is a non-standard extension and some major
## crawlers reportedly ignore it -- confirm for the bots you care about.
Crawl-delay: 10

# Website Sitemap
# The example.com address is a template placeholder; replace it with the
# absolute URL of this site's own sitemap.
Sitemap: http://www.example.com/sitemap.xml


## GENERAL MAGENTO SETTINGS

## Allowable Index
## Paths that are explicitly opened up for crawling:
##   /*?p=                           URLs whose query string starts with "p="
##                                   (presumably listing pagination -- confirm)
##   /catalog/seo_sitemap/category/  SEO sitemap category pages
##   /media/catalog/                 catalog media files
Allow: /*?p=
## Commented out: would carve a blog path out of the /index.php/ Disallow
## that appears later in this file.
#Allow: /index.php/blog/
Allow: /catalog/seo_sitemap/category/
Allow: /media/catalog/

## Do not crawl common Magento technical folders
## Each rule is a path prefix, so everything beneath the folder is covered.
## The /js/, /media/ and /skin/ rules are deliberately left commented out,
## which keeps those folders crawlable (presumably so crawlers can fetch the
## scripts, images and stylesheets needed to render pages -- confirm).
Disallow: /404/
Disallow: /admin/
Disallow: /app/
Disallow: /cgi-bin/
Disallow: /downloader/
Disallow: /errors/
Disallow: /includes/
#Disallow: /js/
Disallow: /lib/
#Disallow: /media/
Disallow: /pkginfo/
Disallow: /shell/
#Disallow: /skin/
Disallow: /var/

## Do not crawl common Magento files
## Individual entry-point scripts and license files in the site root.
Disallow: /api.php
Disallow: /cron.php
Disallow: /cron.sh
Disallow: /get.php
Disallow: /install.php
Disallow: /LICENSE.html
Disallow: /LICENSE.txt
Disallow: /LICENSE_AFL.txt
## The *.js and *.css rules are left commented out, so script and stylesheet
## files stay crawlable.
#Disallow: /*.js$
#Disallow: /*.css$
## Wildcard rule: any URL whose path ends in ".php" ("$" anchors the end).
## For crawlers that support wildcards this also covers the *.php files
## listed individually above; the explicit entries still apply to crawlers
## that only do plain prefix matching.
Disallow: /*.php$

## Paths (clean URLs)
## Front-end routes that should not be crawled, addressed by their
## rewritten (clean) URL prefix. Several of these prefixes are repeated in
## the "Do not crawl magento system paths" section further down.
Disallow: /control/
Disallow: /contacts/
Disallow: /customer/
Disallow: /customize/
Disallow: /newsletter/
Disallow: /poll/
Disallow: /review/
Disallow: /sendfriend/
Disallow: /tag/
Disallow: /wishlist/
Disallow: /catalog/product/gallery/

## Do not crawl Magento extension/blog folders
#Disallow: /wp/


## MAGENTO SEO IMPROVEMENTS

## Do not crawl sub category pages that are sorted or filtered.
## A "/*?name" pattern only matches when the parameter is the FIRST one in
## the query string, so each rule is paired with a "/*&name" form that also
## catches the parameter in any later position (e.g. ?p=2&dir=asc).
## "/*?dir*" already covers both ?dir=asc and ?dir=desc, so those two values
## do not need rules of their own.
Disallow: /*?dir*
Disallow: /*&dir=
Disallow: /*?limit=all
Disallow: /*&limit=all
Disallow: /*?mode*
Disallow: /*&mode=

## Do not crawl 2-nd home page copy
## Blocks every URL under the /index.php/ prefix, i.e. the same pages
## reached through the front controller instead of their clean URL.
Disallow: /index.php/

## Do not crawl links with session IDs
## "/*?SID=" only matches SID as the first query parameter; "/*&SID=" covers
## URLs where it follows other parameters. "/*PHPSESSID" matches the token
## anywhere in the URL.
Disallow: /*?SID=
Disallow: /*&SID=
Disallow: /*PHPSESSID

## Do not crawl magento system paths
## Search, compare, checkout, account and the non-rewritten catalog view
## routes.
## NOTE(review): /customer/account/ and /customer/account/login/ are already
## covered by the /customer/ prefix, and /contacts/, /customer/, /wishlist/,
## /tag/, /sendfriend/, /poll/ and /newsletter/ are also listed in the
## "Paths (clean URLs)" section above. The repeats are harmless but could be
## consolidated.
Disallow: /catalogsearch/
Disallow: /catalog/product_compare/
Disallow: /catalog/category/view/
Disallow: /catalog/product/view/
Disallow: /checkout/
Disallow: /contacts/
Disallow: /customer/
Disallow: /customer/account/
Disallow: /customer/account/login/
Disallow: /wishlist/
Disallow: /tag/
Disallow: /sendfriend/
Disallow: /poll/
Disallow: /newsletter/


## DEVELOPMENT RELATED SETTINGS

## Do not crawl development files and folders
## A rule path must start with "/" (or the "*" wildcard); a bare value such
## as ".sql" is not a valid path pattern and is ignored or never matches.
## The file-type rules therefore use "/*" so they match the name at any
## depth of the site.
## NOTE: robots.txt is only a request to well-behaved crawlers and is itself
## publicly readable; access to these files should also be denied at the web
## server level.
Disallow: /.git/
Disallow: /*.gitignore
Disallow: /*.sql
Disallow: /*.tgz
Disallow: /.idea/
Disallow: /.modman/