# Magento robots.txt: crawl rules tailored to this store

## Website Sitemap
# Sitemap: http://www.example.com/sitemap.xml

## Crawlers Setup
User-agent: *
# Crawl-delay: 30
#
# NOTE: the sections of this group are separated by "#" lines, not blank
# lines. Parsers that follow the original robots.txt convention treat a blank
# line as the end of a record, which would detach every rule after the first
# blank line from the "User-agent: *" line above. Comment-only lines do not
# end a record, so keep using "#" as the separator when editing this group.
#
## Do not crawl common Magento folders
Disallow: /app/
Disallow: /downloader/
Disallow: /errors/
Disallow: /includes/
Disallow: /lib/
Disallow: /pkginfo/
Disallow: /shell/
Disallow: /var/
#
## Do not crawl common Magento files
Disallow: /api.php
Disallow: /cron.php
Disallow: /cron.sh
Disallow: /error_log
Disallow: /get.php
Disallow: /install.php
Disallow: /php.ini.sample
Disallow: /index.php.sample
Disallow: /LICENSE.html
Disallow: /LICENSE.txt
Disallow: /LICENSE_EE.html
Disallow: /LICENSE_EE.txt
Disallow: /LICENSE_AFL.txt
Disallow: /README.txt
Disallow: /RELEASE_NOTES.txt
#
## Do not crawl pages that are sorted, filtered, or paginated with extra params
Disallow: /*?dir=
Disallow: /*?limit=
Disallow: /*?mode=
Disallow: /*?p=*&
#
## Do not crawl homepage copies
# NOTE(review): rules are prefix matches, so this also blocks every URL whose
# path begins with /home (e.g. /home-decor.html) - confirm that is intended.
Disallow: /home
## Uncomment the line below only if SEO URL rewrites are activated
# Disallow: /index.php/
#
## Do not crawl URLs carrying session IDs, or raw script/style/PHP files
Disallow: /*?SID=
# NOTE(review): search engines now ask that CSS and JS stay crawlable so pages
# can be rendered; confirm the next two rules are still wanted.
Disallow: /*.js$
Disallow: /*.css$
Disallow: /*.php$
#
## Do not crawl checkout and customer account pages
Disallow: /checkout/
Disallow: /checkout/cart/
Disallow: /checkout/cart/add/
Disallow: /onestepcheckout/
Disallow: /customer/
Disallow: /customer/account/
Disallow: /customer/account/login/
#
## Do not crawl search pages and non-SEO-optimized catalog links
Disallow: /catalogsearch/
Disallow: /catalogsearch/advanced/
Disallow: /catalogsearch/advanced/result/
Disallow: /catalogsearch/term/
Disallow: /catalogsearch/term/popular/
Disallow: /catalog/product_compare/
Disallow: /catalog/category/view/
Disallow: /catalog/product/view/
#
## Do not crawl other non-SEO-optimized links
Disallow: /customize/
Disallow: /newsletter/
Disallow: /poll/
Disallow: /review/
Disallow: /sendfriend/
Disallow: /tag/
Disallow: /wishlist/

## Extra: Uncomment the below if you do not want Google and Bing to index your images
# User-agent: Googlebot-Image
# Disallow: /
# User-agent: msnbot-media
# Disallow: /