robots.txt details

e7bc2c677a3ac39624bbacfbf70766d2

saved: | size: 1724kb | checksum: e7bc2c677a3ac39624bbacfbf70766d2

websites using this robots.txt

content




# Sitemaps for all country sites.
# Sitemap lines are independent of any User-agent group, so they are listed
# on their own rather than in the middle of a group.
Sitemap: https://www.mysortimo.fr/static/content/sitemaps/fr/sitemap-fr.xml
Sitemap: https://www.mysortimo.de/static/content/sitemaps/de/sitemap-de.xml
Sitemap: https://www.mysortimo.no/static/content/sitemaps/no/sitemap-no.xml
Sitemap: https://www.mysortimo.nl/static/content/sitemaps/nl/sitemap-nl.xml
Sitemap: https://www.mysortimo.at/static/content/sitemaps/at/sitemap-at.xml
Sitemap: https://www.mysortimo.be/static/content/sitemaps/be/sitemap-be.xml
Sitemap: https://www.mysortimo.com/static/content/sitemaps/com/sitemap-com.xml
Sitemap: https://www.mysortimo.dk/static/content/sitemaps/dk/sitemap-dk.xml
Sitemap: https://www.mysortimo.us/static/content/sitemaps/us/sitemap-us.xml
Sitemap: https://www.mysortimo.se/static/content/sitemaps/se/sitemap-se.xml
Sitemap: https://www.mysortimo.co.uk/static/content/sitemaps/co.uk/sitemap-co.uk.xml
# NOTE(review): unlike the entries above, this path has no per-country
# directory (".../sitemaps/es/...") - confirm the URL is correct.
Sitemap: https://www.mysortimo.es/static/content/sitemaps/sitemap-es.xml

# Rules for all robots.
# The rules must follow the User-agent line directly, with no blank line in
# between: parsers that end a group at a blank line would otherwise discard
# the group and ignore every rule below.
User-agent: *
# Block access to specific groups of pages
Disallow: /de/robots.txt
Disallow: /de/cart
Disallow: /de/checkout
Disallow: /de/my-account
# Throttling hints (non-standard extensions; crawlers that do not support
# them ignore them)
Request-rate: 1/10 # maximum rate is one page every 10 seconds
Crawl-delay: 10 # 10 seconds between page requests
Visit-time: 0400-0845 # only visit between 04:00 and 08:45 UTC


# Crawlers blocked from the whole site:
#   CazoodleBot - does not present correct accept content headers
#   MJ12bot     - it is just noise
User-agent: CazoodleBot
User-agent: MJ12bot
Disallow: /

# Block dotbot as it cannot parse base urls properly.
# The User-agent value is the bare product token, without a version suffix:
# a value such as "dotbot/1.0" is not a valid product token and is never
# matched by parsers that compare it against the crawler name "dotbot".
User-agent: dotbot
Disallow: /

# Block Gigabot from the entire site (no reason is recorded in this file)
User-agent: Gigabot
Disallow: /