#
# robots.txt
#
# This file is to prevent the crawling and indexing of certain parts
# of your site by web crawlers and spiders run by sites like Yahoo!
# and Google. By telling these "robots" where not to go on your site,
# you save bandwidth and server resources.
#
# This file will be ignored unless it is at the root of your host:
# Used:    http://example.com/robots.txt
# Ignored: http://example.com/site/robots.txt
#
# For more information about the robots.txt standard, see:
# http://www.robotstxt.org/robotstxt.html
#
# For syntax checking, see:
# http://www.frobee.com/robots-txt-check
#
# Formatting rules for maintainers:
#   * One directive per line. robots.txt is line-oriented, and a "#"
#     comments out everything up to the end of the line.
#   * Do not put blank lines inside a User-agent group; some parsers
#     treat a blank line as the end of the group. Use "#" lines instead.

# Sitemap locations. These are independent of any User-agent group.
Sitemap: http://www.yourtango.com/sitemap
Sitemap: http://www.yourtango.com/sitemap.xml

# The AdSense crawler may fetch everything (an empty Disallow allows all).
User-agent: Mediapartners-Google
Disallow:

# Rules for every crawler that has no more specific group in this file.
User-agent: *
Crawl-delay: 5
# Directories
Disallow: /feed/
Disallow: /experts/user-login
Disallow: /experts/user-register
Disallow: /experts/search
Disallow: /experts/search/
Disallow: /taxonomy/term/
Disallow: /7181/
Disallow: /prouser/
Disallow: /print/
Disallow: /printmail/
Disallow: /popup/
Disallow: /fb_cb/
Disallow: /archive/
Disallow: /forward/
Disallow: /node-comment/
Disallow: /includes/
Disallow: /misc/
Disallow: /modules/
Disallow: /profiles/
Disallow: /scripts/
Disallow: /sites/all
Disallow: /sites/default/default.settings.php
Disallow: /sites/default/settings.php
Disallow: /themes/
Disallow: /plugins/feedback.php
# Files
Disallow: /CHANGELOG.txt
Disallow: /cron.php
Disallow: /social-share-cron.php
Disallow: /INSTALL.mysql.txt
Disallow: /INSTALL.pgsql.txt
Disallow: /install.php
Disallow: /INSTALL.txt
Disallow: /LICENSE.txt
Disallow: /MAINTAINERS.txt
Disallow: /update.php
Disallow: /UPGRADE.txt
Disallow: /xmlrpc.php
# Paths (clean URLs)
Disallow: /admin/
Disallow: /users/
Disallow: /user/
Disallow: /comment/reply/
Disallow: /contact/
Disallow: /logout/
Disallow: /node/add/
Disallow: /search/
Disallow: /user/register/
Disallow: /user/password/
Disallow: /user/login/
# Fixes for slow crawl
Disallow: /hybridauth/
# Paths (no clean URLs)
Disallow: /?q=admin/
Disallow: /?q=comment/reply/
Disallow: /?q=contact/
Disallow: /?q=logout/
Disallow: /?q=node/add/
Disallow: /?q=search/
Disallow: /?q=user/password/
Disallow: /?q=user/register/
Disallow: /?q=user/login/
# NOTE(review): the next two patterns do not begin with "/". They are kept
# exactly as written; confirm that the crawlers you care about honour them.
Disallow: *gadcreatives.glam.com*
Disallow: *gadcreatives.mode.com*
# Fixes for slow crawl
Disallow: /?q=hybridauth/
# Allow specific URLs
Allow: /sites/all/themes/pinkduck/images/sprite*
Allow: /sites/all/themes/pinkduck/i/*
Allow: /sites/all/themes/ytresponsive/*
Allow: /users/radar-online
# Fixes for slow crawl
Allow: /sites/all/themes/ytpurple/*
Allow: /*/*.css
Allow: /*/*.js
Allow: /*/*.gif
Allow: /*/*.jpg
Allow: /*/*.jpeg
Allow: /*/*.png
Allow: /*/*.svg
Allow: /sites/all/*/*.css
Allow: /sites/all/*/*.js
Allow: /sites/all/*/*.gif
Allow: /sites/all/*/*.jpg
Allow: /sites/all/*/*.jpeg
Allow: /sites/all/*/*.png
Allow: /sites/all/*/*.svg
# Fixes for old sitemap index links
Disallow: /sitemap-*.xml
Allow: /sitemap.xml
Allow: /sitemap
Allow: /sitemap/*

# Allow the Boomtrain bot on the entire site.
# A User-agent value is a product token (letters, "_" and "-" only); "*" is
# meaningful only on its own as the catch-all. The plain token is listed so
# that parsers comparing the token literally match this group; the original
# spelling with a trailing "*" is kept for backward compatibility.
User-agent: Boomtrain-Content-Bot
User-agent: Boomtrain-Content-Bot*
Disallow:
Allow: /*