# robots.txt -- crawler access policy for this site.
#
# Format reminders:
#   * One record per line; a "#" turns the rest of that line into a comment.
#   * A group is one or more "User-agent" lines followed by its rules.
#   * A crawler obeys only the group that matches it most specifically;
#     rules from the "*" group are NOT merged into a named group.

# Default rule for all well-behaved crawlers.
# Everything is crawlable except the community pages listed below.
User-agent: *
Disallow: /communities
# Already covered by the /communities prefix above; kept for explicitness.
Disallow: /communities/create
Disallow: /community/

# Search engines that we want to keep indexing the site.
# NOTE(review): because each crawler below has its own group, none of them
# inherits the /communities and /community/ rules from the "*" group. If
# those paths should also stay out of search results, repeat the Disallow
# lines in each of these groups -- confirm the intent.
User-agent: Googlebot
Allow: /

User-agent: Googlebot-Image
Allow: /

User-agent: Googlebot-Video
Allow: /

User-agent: Bingbot
Allow: /

User-agent: DuckDuckBot
Allow: /

User-agent: YandexBot
Allow: /

# Semrush SEO / Site Audit crawlers (not used here; reduce unnecessary crawl load).
User-agent: SemrushBot
Disallow: /

User-agent: SemrushBot-SA
Disallow: /

# AI-training crawlers: block entirely.
# Backed up by Cloudflare WAF rules; robots.txt is best-effort.
User-agent: GPTBot
Disallow: /

User-agent: ChatGPT-User
Disallow: /

User-agent: OAI-SearchBot
Disallow: /

User-agent: ClaudeBot
Disallow: /

User-agent: Claude-Web
Disallow: /

User-agent: anthropic-ai
Disallow: /

User-agent: cohere-ai
Disallow: /

User-agent: Amazonbot
Disallow: /

User-agent: meta-externalagent
Disallow: /

User-agent: FacebookBot
Disallow: /

User-agent: Bytespider
Disallow: /

User-agent: PerplexityBot
Disallow: /

User-agent: CCBot
Disallow: /

User-agent: Diffbot
Disallow: /

User-agent: ImagesiftBot
Disallow: /

User-agent: Omgili
Disallow: /

User-agent: Omgilibot
Disallow: /

User-agent: Applebot-Extended
Disallow: /

User-agent: Google-Extended
Disallow: /

User-agent: Google-CloudVertexBot
Disallow: /

User-agent: GoogleOther
Disallow: /

User-agent: YouBot
Disallow: /

User-agent: Timpibot
Disallow: /

User-agent: Scrapy
Disallow: /

# Sitemap location (independent of any User-agent group).
Sitemap: https://www.kasarosa.tv/sitemap.xml