# Default rules: apply to every crawler that does not match a more specific
# User-agent group elsewhere in this file.
# robots.txt is line-oriented: each directive must be on its own line.
# No blank lines are used inside this group because some parsers treat a
# blank line as the end of the group; a bare "#" is used as a separator.
User-agent: *
Allow: /
#
# NOTE(review): several patterns below start with "*" instead of "/".
# RFC 9309 path patterns begin with "/" - confirm the crawlers you care
# about honor these as written before relying on them.
Disallow: */language/switch/to/0?redirect=
Disallow: */language/switch/to/1?redirect=
Disallow: /app_link_redirector.php
Disallow: */blog/wp-admin
Disallow: */redirect?url=
Disallow: */news/feeds
Disallow: /blog/tag/*/feed/
Disallow: /*?token=
Disallow: /*?exit=
#
# For Organization
Disallow: /organization
Disallow: /organization/*
#
# Daily event pages (no search indexing / ranking)
Disallow: /daily-event/
Disallow: /en/daily-event/
#
# URLs carrying query parameters (t= / token=)
Disallow: /talk-with-us?t=
Disallow: /subscription?token=
Disallow: /subscription-packages?token=
Disallow: /paramarsha?token=
Disallow: /paramarsha/1?token=
#
# Disallow old/deleted sitemap URLs
Disallow: /sitemap-bs-dates.xml
Disallow: /sitemap-bs-dates-panchanga.xml
Disallow: /sitemap-bs-year-month.xml
Disallow: /sitemap-bs-year.xml
Disallow: /sitemap-ad-year.xml
Disallow: /sitemap-ad-dates.xml
Disallow: /sitemap-ad-year-month.xml
Disallow: /sitemaps/default-sitemap.xml
Disallow: /sitemaps/en-sitemap.xml
Disallow: /sitemaps/en-sitemap-ad-dates.xml
Disallow: /sitemaps/sitemap-ad-dates.xml
Disallow: /sitemaps/sitemap-ad-year.xml
Disallow: /sitemaps/sitemap-ad-year-month.xml
Disallow: /sitemaps/sitemap-bs-dates.xml
Disallow: /sitemaps/sitemap-bs-dates-panchanga.xml
Disallow: /sitemaps/sitemap-bs-year.xml
Disallow: /sitemaps/sitemap-bs-year-month.xml
Disallow: /radios.xml

# ===========================================
# AI Training Crawlers - BLOCKED
# These bots scrape content to train AI models
# with no attribution or referral traffic.
# ===========================================
# Each group below is written one directive per line; a blank line
# separates groups. Every listed crawler is denied the whole site.

User-agent: GPTBot
Disallow: /

User-agent: Google-Extended
Disallow: /

User-agent: ClaudeBot
Disallow: /

User-agent: anthropic-ai
Disallow: /

User-agent: CCBot
Disallow: /

User-agent: Bytespider
Disallow: /

User-agent: Meta-ExternalAgent
Disallow: /

User-agent: Meta-ExternalFetcher
Disallow: /

User-agent: cohere-ai
Disallow: /

User-agent: Google-CloudVertexBot
Disallow: /

# ===========================================
# AI Citation Crawlers - ALLOWED
# These bots fetch content in real-time and
# cite nepalipatro.com.np with source links,
# driving referral traffic back to the site.
# ===========================================
# NOTE(review): a crawler that matches one of these groups follows only
# that group, so the Disallow rules in the "User-agent: *" group do not
# apply to it. With only "Allow: /" here, these bots may fetch every URL
# on the site - confirm that is intended.

User-agent: ChatGPT-User
Allow: /

User-agent: OAI-SearchBot
Allow: /

User-agent: PerplexityBot
Allow: /

User-agent: Perplexity-User
Allow: /

User-agent: Claude-SearchBot
Allow: /

User-agent: Claude-User
Allow: /

User-agent: DuckAssistBot
Allow: /

# NOTE(review): Applebot-Extended is presumably Apple's opt-out token for
# generative-AI training use rather than a citation crawler - verify
# against Apple's Applebot documentation that it belongs in this section.
User-agent: Applebot-Extended
Allow: /

User-agent: Amazonbot
Allow: /

# Current sitemaps
Sitemap: https://nepalipatro.com.np/sitemap.xml
Sitemap: https://nepalipatro.com.np/radios-index.xml