1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36
|
#
# robots_allow.txt.erb - Generated robots.txt file
#
# Layout: one default group for all crawlers (selected paths blocked and
# crawl pacing hints), followed by one group per crawler that is blocked
# from the whole site.
#
#
# For all robots
User-agent: *
# Block access to specific groups of pages
Disallow: /cart
Disallow: /checkout
Disallow: /my-account
# Crawl pacing hints. Request-rate and Crawl-delay below express the same
# limit (one request per 10 seconds).
# NOTE(review): Request-rate, Crawl-delay and Visit-time are non-standard
# extensions (not defined by RFC 9309); crawlers that do not recognise them
# will ignore them - confirm which crawlers these are intended for.
Request-rate: 1/10 # maximum rate is one page every 10 seconds
Crawl-delay: 10 # 10 seconds between page requests
Visit-time: 0400-0845 # only visit between 04:00 and 08:45 UTC
# Allow search crawlers to discover the sitemap
# (Sitemap is not scoped to a User-agent group; it applies to any crawler
# that reads this file, even though it appears between groups here.)
Sitemap: https://www.hobbylobby.com/sitemap.xml
# Block CazoodleBot entirely, as it does not send correct Accept headers
User-agent: CazoodleBot
Disallow: /
# Block MJ12bot entirely, as it is just noise
User-agent: MJ12bot
Disallow: /
# Block dotbot entirely, as it cannot parse base URLs properly
User-agent: dotbot
Disallow: /
# Block Gigabot entirely
# NOTE(review): no reason is recorded for this block - confirm it is still wanted.
User-agent: Gigabot
Disallow: /
|