robots.txt details

saved: size: 2505 kb md5 checksum: 671a77647ff168fb3fe9015b6bef6205

websites using this robots.txt

content


#
# robots.txt 2023-03-21
#
# This file asks web crawlers and spiders run by sites like Yahoo!
# and Google not to crawl certain parts of your site. By telling these
# "robots" where not to go on your site, you save bandwidth and server
# resources. Note that blocking crawling does not by itself keep a URL
# out of search indexes if other pages link to it.
#
# This file will be ignored unless it is at the root of your host:
# Used:    http://example.com/robots.txt
# Ignored: http://example.com/site/robots.txt
#
# For more information about the robots.txt standard, see:
# http://www.robotstxt.org/robotstxt.html

User-agent: *
User-agent: Googlebot
User-agent: Googlebot-News
User-agent: Googlebot-Image
User-agent: Googlebot-Video
User-agent: Googlebot-Mobile
User-agent: Twitterbot
Disallow: /files/

User-agent: UbiCrawler
Disallow: /

User-agent: DOC
Disallow: /

User-agent: Zao
Disallow: /

User-agent: sitecheck.internetseer.com
Disallow: /

User-agent: Zealbot
Disallow: /

User-agent: MSIECrawler
Disallow: /

User-agent: SiteSnagger
Disallow: /

User-agent: WebStripper
Disallow: /

User-agent: WebCopier
Disallow: /

User-agent: Fetch
Disallow: /

User-agent: Offline Explorer
Disallow: /

User-agent: Teleport
Disallow: /

User-agent: TeleportPro
Disallow: /

User-agent: WebZIP
Disallow: /

User-agent: linko
Disallow: /

User-agent: HTTrack
Disallow: /

User-agent: Microsoft.URL.Control
Disallow: /

User-agent: Xenu
Disallow: /

User-agent: larbin
Disallow: /

User-agent: libwww
Disallow: /

User-agent: ZyBORG
Disallow: /

User-agent: Download Ninja
Disallow: /

#
# Blocked because it causes problems most of the time
#

User-agent: wget
Disallow: /

User-agent: grub-client
Disallow: /

User-agent: k2spider
Disallow: /

User-agent: NPBot
Disallow: /

User-agent: WebReaper
Disallow: /
 
Sitemap: https://www.eluniversal.com.mx/arc/outboundfeeds/news/?outputType=xml
Sitemap: https://www.eluniversal.com.mx/arc/outboundfeeds/general/?outputType=xml
Sitemap: https://www.eluniversal.com.mx/sitemaps/web/nacion/?outputType=xml
Sitemap: https://www.eluniversal.com.mx/sitemaps/web/elecciones/?outputType=xml
Sitemap: https://www.eluniversal.com.mx/sitemaps/web/metropoli/?outputType=xml
Sitemap: https://www.eluniversal.com.mx/sitemaps/web/edomex/?outputType=xml
Sitemap: https://www.eluniversal.com.mx/sitemaps/web/estados/?outputType=xml
Sitemap: https://www.eluniversal.com.mx/sitemaps/web/opinion/?outputType=xml
Sitemap: https://www.eluniversal.com.mx/sitemaps/web/deportes/?outputType=xml
Sitemap: https://www.eluniversal.com.mx/sitemaps/web/ciencia-y-salud/?outputType=xml