# robots.txt for https://www.pypestream.ai
#
# Layout notes:
#   * One directive per line; '#' starts a comment that runs to end of line.
#   * A crawler obeys ONLY the most specific User-agent group that matches it
#     and ignores the '*' group once a named group applies. Every named group
#     below therefore repeats the /api/ exclusion instead of relying on '*'.
#   * 'Disallow: /api/' is listed before 'Allow: /' so that first-match parsers
#     reach the same result as longest-match (RFC 9309) parsers.

# Sitemap (group-independent record; kept outside every User-agent group)
Sitemap: https://www.pypestream.ai/sitemap.xml

# ─── Default policy ──────────────────────────────────────────────────────────
# Disallow admin/internal paths, allow everything else.
User-agent: *
Disallow: /api/
Allow: /

# ─── AI Crawlers (Answer Engine Optimization) ───────────────────────────────
# Explicitly allow all major AI training and retrieval crawlers,
# while keeping the internal /api/ paths excluded.

# OpenAI / ChatGPT
User-agent: GPTBot
Disallow: /api/
Allow: /

# OpenAI browsing plugin
User-agent: ChatGPT-User
Disallow: /api/
Allow: /

# OpenAI retrieval crawler (used by ChatGPT search and Bing integration)
User-agent: OAI-SearchBot
Disallow: /api/
Allow: /

# Anthropic / Claude
User-agent: ClaudeBot
Disallow: /api/
Allow: /

User-agent: anthropic-ai
Disallow: /api/
Allow: /

# Google Gemini / AI Overviews
User-agent: Google-Extended
Disallow: /api/
Allow: /

# Perplexity AI
User-agent: PerplexityBot
Disallow: /api/
Allow: /

# Meta AI
User-agent: FacebookBot
Disallow: /api/
Allow: /

# Apple
User-agent: Applebot-Extended
Disallow: /api/
Allow: /

# Common Crawl (used by many LLM training datasets)
User-agent: CCBot
Disallow: /api/
Allow: /

# Cohere
User-agent: cohere-ai
Disallow: /api/
Allow: /

# Mistral
User-agent: MistralAI-User
Disallow: /api/
Allow: /

# You.com
User-agent: YouBot
Disallow: /api/
Allow: /

# Brave Search
# NOTE(review): confirm "Brave" is the token Brave's crawler actually matches.
User-agent: Brave
Disallow: /api/
Allow: /

# Microsoft Copilot / Bing AI
User-agent: bingbot
Disallow: /api/
Allow: /

User-agent: msnbot
Disallow: /api/
Allow: /

# Amazon Alexa
User-agent: Amazonbot
Disallow: /api/
Allow: /

# Applebot
User-agent: Applebot
Disallow: /api/
Allow: /