robots.txt details

saved: size: 1332 kb md5 checksum: fb87af14ff8a95c10510c59389124e68

websites using this robots.txt

content


# $Id: robots.txt,v 1.9.2.1 2008/12/10 20:12:19 goba Exp $
#
# robots.txt
#
# This file is to prevent the crawling and indexing of certain parts
# of your site by web crawlers and spiders run by sites like Yahoo!
# and Google. By telling these "robots" where not to go on your site,
# you save bandwidth and server resources.
#
# This file will be ignored unless it is at the root of your host:
# Used:    http://example.com/robots.txt
# Ignored: http://example.com/site/robots.txt
#
# For more information about the robots.txt standard, see:
# http://www.robotstxt.org/wc/robots.html
#
# For syntax checking, see:
# http://www.sxw.org.uk/computing/robots/check.html

# Rules for all crawlers: the "User-agent: *" group asks every robot not to
# fetch the paths listed below.
User-agent: *
# Disallowed paths. Values ending in "/" are directory-style entries; the
# entries without a trailing slash further down are bare path prefixes.
Disallow: /content/user/
Disallow: /popup/
Disallow: /content/sites/default/files/downloads/
Disallow: /alert/
Disallow: /userAccount/
Disallow: /settings/
Disallow: /usageStatistics/
Disallow: /payment/
Disallow: /mediaReport/
Disallow: /toc_list/
Disallow: /admin/
Disallow: /logout/
Disallow: /noAccess/
Disallow: /sourceInformation/
# Search pages are managed via a nofollow meta tag in the application, so
# the following two rules are intentionally left commented out:
#   Disallow: /dosearch/
#   Disallow: /dosearch
# NOTE(review): under prefix matching "/document" already covers "/document/"
# (and would also match paths such as "/documents") - confirm both are wanted.
Disallow: /document/
Disallow: /document
# Only this single form-engine action path is listed, not a whole directory.
Disallow: /formEngine/doAction
# NOTE(review): same overlap as above - "/snoopio" already covers "/snoopio/".
Disallow: /snoopio/
Disallow: /snoopio