##################################################
# Vanilla-wide rules
##################################################

# NOTE: robots.txt is line-oriented and '#' comments run to end of line,
# so every directive below must sit on its own line to take effect.

# Rules for all crawlers that are not matched by a more specific group.
User-agent: *

# Common path patterns (* prefix to handle localisation)
Disallow: */deals/compare
Disallow: */html/
Disallow: */p/*/embed/captioned
Disallow: */outlink*

# Common query string patterns
Disallow: *searchTerm=*
Disallow: *sortBy=*
Disallow: *productBrand=*
# Percent-encoded "{" ... "}" anywhere in the URL
Disallow: *%7B*%7D*
Disallow: *seenMatchId=*

# Infinite scroll paths
Disallow: /infinite-scroll-article/*
Disallow: /infinite-scroll-review/*
Disallow: /infinite-scroll-recipe/*

# AI crawlers: one group shared by every agent listed, blocked site-wide.
User-agent: bytespider
User-agent: mistralai
User-agent: cohere
User-agent: ai2bot
User-agent: youbot
User-agent: omgili
User-agent: diffbot
User-agent: kangaroo
User-agent: img2dataset
User-agent: amazonbot
User-agent: amazon-qbusiness
User-agent: meta-externalagent
User-agent: meta-webindexer
Disallow: /

##################################################
# Site-specific rules
##################################################

# Second group for "*": parsers following RFC 9309 combine it with the
# vanilla-wide "*" group above, so both sets of rules apply.
User-agent: *
Disallow: /search
Disallow: /*searchTerm
Disallow: /deals/compare
Disallow: /shop*
Disallow: /*productBrand
Disallow: *jwsource=*

##################################################
# Sitemaps
##################################################

# Sitemap lines are independent of user-agent groups, so no User-agent
# line is needed here; each sitemap URL is listed exactly once.
Sitemap: https://theweekjunior.co.uk/sitemap.xml
Sitemap: https://theweekjunior.co.uk/sitemap-news.xml
Sitemap: https://sciencenature.theweekjunior.co.uk/sitemap.xml