# robots.txt for www.polymax.co.uk
#
# Layout rules for anyone editing this file:
#   * One directive per line; "#" starts a comment that runs to end of line.
#   * A crawler that matches a named "User-agent" group obeys ONLY that group
#     and ignores the "User-agent: *" group. Any named crawler that should
#     also respect the shared Disallow list must therefore have the list
#     repeated inside its own group (see AhrefsBot and bingbot below).
#   * No blank lines inside a group: some parsers treat a blank line as the
#     end of the group.

Sitemap: https://www.polymax.co.uk/sitemap/uk/sitemapindex.xml

# Googlebot does not honour Crawl-delay; its crawl rate is managed through
# Search Console, so the Google agents are intentionally left out of this
# file. The commented-out agents below are kept for reference.
#User-agent: DotBot
#User-agent: Googlebot
#User-agent: Googlebot-image

# AhrefsBot fetches pages very quickly and, unlike Google, does not throttle
# itself. Limit it to one request every 120 seconds.
# The Disallow list is a copy of the active rules in the "User-agent: *"
# group - keep the two in sync.
User-agent: AhrefsBot
Crawl-Delay: 120
Disallow: /404/
Disallow: /app/
Disallow: /cgi-bin/
Disallow: /downloader/
Disallow: /errors/
Disallow: /includes/
Disallow: /magento/
Disallow: /pkginfo/
Disallow: /report/
Disallow: /scripts/
Disallow: /captcha/
Disallow: /shell/
Disallow: /stats/
Disallow: /var/
Disallow: /index.php/
Disallow: /catalog/product_compare/
Disallow: /catalogsearch/
Disallow: /checkout/
Disallow: /control/
Disallow: /contacts/
Disallow: /customer/
Disallow: /customize/
Disallow: /poll/
Disallow: /sendfriend/
Disallow: /tag/
Disallow: /wishlist/
Disallow: /cron.php
Disallow: /cron.sh
Disallow: /error_log
Disallow: /install.php
Disallow: /LICENSE.html
Disallow: /LICENSE.txt
Disallow: /LICENSE_AFL.txt
Disallow: /STATUS.txt
Disallow: /*.php$
Disallow: /*?SID=

# bingbot: one request every 320 seconds.
# The Disallow list is a copy of the active rules in the "User-agent: *"
# group - keep the two in sync.
User-agent: bingbot
Crawl-Delay: 320
Disallow: /404/
Disallow: /app/
Disallow: /cgi-bin/
Disallow: /downloader/
Disallow: /errors/
Disallow: /includes/
Disallow: /magento/
Disallow: /pkginfo/
Disallow: /report/
Disallow: /scripts/
Disallow: /captcha/
Disallow: /shell/
Disallow: /stats/
Disallow: /var/
Disallow: /index.php/
Disallow: /catalog/product_compare/
Disallow: /catalogsearch/
Disallow: /checkout/
Disallow: /control/
Disallow: /contacts/
Disallow: /customer/
Disallow: /customize/
Disallow: /poll/
Disallow: /sendfriend/
Disallow: /tag/
Disallow: /wishlist/
Disallow: /cron.php
Disallow: /cron.sh
Disallow: /error_log
Disallow: /install.php
Disallow: /LICENSE.html
Disallow: /LICENSE.txt
Disallow: /LICENSE_AFL.txt
Disallow: /STATUS.txt
Disallow: /*.php$
Disallow: /*?SID=

# pingdom: one request every 320 seconds.
# NOTE(review): pingdom is presumably the uptime monitor rather than a search
# crawler, so it is left with a Crawl-delay only and no path restrictions -
# confirm this is intended.
User-agent: pingdom
Crawl-Delay: 320

#User-agent: SemrushBot
#Crawl-Delay: 140

# We don't care about Russian search, and the MJ12 bot is a pest: block both
# from the whole site.
User-agent: yandex
Disallow: /

User-Agent: MJ12bot
Disallow: /

# Every crawler without a named group above: only crawl what we care about.
User-agent: *
# Directories
Disallow: /404/
Disallow: /app/
Disallow: /cgi-bin/
Disallow: /downloader/
Disallow: /errors/
Disallow: /includes/
#Disallow: /js/
#Disallow: /lib/
Disallow: /magento/
#Disallow: /media/
Disallow: /pkginfo/
Disallow: /report/
Disallow: /scripts/
Disallow: /captcha/
Disallow: /shell/
#Disallow: /skin/
Disallow: /stats/
Disallow: /var/
# Paths (clean URLs)
Disallow: /index.php/
Disallow: /catalog/product_compare/
#Disallow: /catalog/category/view/
#Disallow: /catalog/product/view/
Disallow: /catalogsearch/
Disallow: /checkout/
Disallow: /control/
Disallow: /contacts/
Disallow: /customer/
Disallow: /customize/
#Disallow: /newsletter/
Disallow: /poll/
#Disallow: /review/
Disallow: /sendfriend/
Disallow: /tag/
Disallow: /wishlist/
#Disallow: /catalog/product/gallery/
# Files
Disallow: /cron.php
Disallow: /cron.sh
Disallow: /error_log
Disallow: /install.php
Disallow: /LICENSE.html
Disallow: /LICENSE.txt
Disallow: /LICENSE_AFL.txt
Disallow: /STATUS.txt
# Paths (no clean URLs)
#Disallow: /*.js$
#Disallow: /*.css$
Disallow: /*.php$
Disallow: /*?SID=
#Disallow: /*.pdf$