# robots.txt for www.a2zwordfinder.com
#
# Reading notes (Robots Exclusion Protocol, RFC 9309):
#   * One directive per line. A group is one or more "User-agent:" lines
#     followed by the rules that apply to those agents.
#   * A crawler obeys ONLY the most specific group that names it. If such a
#     group exists, the crawler ignores "User-agent: *" completely, so any
#     rule meant for every crawler must be repeated in every named group.
#   * Path rules are prefix matches: "Disallow: /amember/" also covers
#     /amember/admin/, /amember/login, /amember/signup, /amember/member
#     and /amember/aff/.
#   * "Crawl-delay" is a non-standard extension; not every crawler honours it.

# ---------------------------------------------------------------------------
# Fully blocked crawlers
# ---------------------------------------------------------------------------

# Block AI training crawlers (no return traffic, pure scraping)
User-agent: GPTBot
User-agent: CCBot
User-agent: Google-Extended
User-agent: anthropic-ai
User-agent: Claude-Web
User-agent: ClaudeBot
User-agent: Claude-SearchBot
User-agent: Bytespider
User-agent: cohere-ai
Disallow: /

# NOTE(review): meta-externalagent used to be declared twice, once with
# "Crawl-delay: 3" (Meta throttling, 2026-03-24) and once with "Disallow: /".
# Groups for the same agent are merged, so the effective policy was already a
# full block; it is now stated once. Confirm that blocking (not throttling)
# is what is wanted.
User-agent: meta-externalagent
Disallow: /

# ---------------------------------------------------------------------------
# Default rules for every crawler that has no group of its own
# ---------------------------------------------------------------------------
User-agent: *
Allow: /

# Cloudflare internals
Disallow: /cdn-cgi/bm/cv/
Disallow: /cdn-cgi/challenge-platform/
Disallow: /cdn-cgi/images/trace/
Disallow: /cdn-cgi/rum
Disallow: /cdn-cgi/scripts/
Disallow: /cdn-cgi/styles/
Disallow: /cdn-fpw/sxg/

# Disallow sensitive and unnecessary areas
# NOTE(review): robots.txt is public and is not access control. Listing paths
# such as /.git/, /backup/ or /logs/ advertises them; they must also be
# protected at the web-server level.
Disallow: /banners/
Disallow: /pro/
Disallow: /membersOnly/
Disallow: /cgi-bin/
Disallow: /images/
Disallow: /logs/
Disallow: /private/
Disallow: /admin/
Disallow: /tmp/
Disallow: /temp/
Disallow: /*.log$
Disallow: /*.tmp$
Disallow: /backup/
Disallow: /.git/
Disallow: /.htaccess
Disallow: /server-status
Disallow: /server-info

# Disallow crawling of development and utility files
Disallow: /*.bak$
Disallow: /config/
Disallow: /dev-tools/
Disallow: /test/
Disallow: /testing/

# Block all crawlers from aMember membership system
# (repeated in every named group below, because named groups do not inherit
# from "User-agent: *")
Disallow: /amember/

# ---------------------------------------------------------------------------
# Crawlers with their own group
# NOTE(review): these crawlers ignore the "User-agent: *" Disallow list above.
# Only the aMember block is repeated here; if the sensitive-area rules should
# apply to them as well, copy those rules into each group.
# ---------------------------------------------------------------------------

# Allow popular search engines
User-agent: Googlebot
User-agent: Slurp
User-agent: DuckDuckBot
Allow: /
Disallow: /amember/

# Bing (user-agent matching is case-insensitive, so one entry is enough)
User-agent: Bingbot
Allow: /
Crawl-delay: 20
Disallow: /amember/

# Meta/Facebook bot throttling (2026-03-24)
User-agent: meta-webindexer
Crawl-delay: 2
Disallow: /amember/

# SEO tool crawlers — rate-limited (heavy scrapers, low reciprocal value)
User-agent: SemrushBot
User-agent: AhrefsBot
Allow: /
Crawl-delay: 30
Disallow: /amember/

# Applebot bumped 10→30 on 2026-04-11 — #1 503 offender after 4-lang sitemap expansion
User-agent: Applebot
Crawl-delay: 30
Disallow: /amember/

# Perplexity AI search — rate-limited after 4-lang sitemap expansion 2026-04-11
User-agent: PerplexityBot
User-agent: Perplexity-User
Crawl-delay: 20
Disallow: /amember/

# ---------------------------------------------------------------------------
# Sitemaps (independent of any user-agent group)
# ---------------------------------------------------------------------------
Sitemap: https://www.a2zwordfinder.com/sitemap.xml
Sitemap: https://www.a2zwordfinder.com/sitemaps/sitemap-index.xml