# For all robots User-agent: * Disallow: # Block access to specific groups of pages Disallow: /college/us/cart Disallow: /college/us/checkout Disallow: /college/us/my-account Disallow: /college/us/termsOfUse* Request-rate: 1/10 # maximum rate is one page every 10 seconds Crawl-delay: 10 # 10 seconds between page requests Visit-time: 0400-0845 # only visit between 04:00 and 08:45 UTC # Allow search crawlers to discover the sitemap Sitemap: https://www.macmillanlearning.com/college/us/sitemap.xml Sitemap: https://www.macmillanlearning.com/college/ca/sitemap.xml # Block CazoodleBot as it does not present correct accept content headers User-agent: CazoodleBot Disallow: / # Block MJ12bot as it is just noise User-agent: MJ12bot Disallow: / # Block dotbot as it cannot parse base urls properly User-agent: dotbot/1.0 Disallow: / # Block Gigabot User-agent: Gigabot Disallow: / # Block searchText and PreviewLabel string Disallow: */*?searchText=* Disallow: */*?PreviewLabel=* #Block access to specific groups of pages Disallow: /college/us/login* Disallow: /college/ca/login*