# https://omegacentauri.me/robots.txt
# The Omega Centauri Society — research / education portal.
# Citation is welcome; explicit allow for major search and AI retrieval crawlers.
# Last reviewed: 2026-05-11
#
# Format notes (Robots Exclusion Protocol, RFC 9309):
#   - One directive per line; a "#" comments out the REST OF THAT LINE, so
#     directives must never share a line with a preceding comment.
#   - A crawler obeys only the single most specific User-agent group that
#     matches it; groups are not merged with the "*" group.

# ────────────────────────────────────────────────────────────────────
# Default — open to everyone unless overridden below
# ────────────────────────────────────────────────────────────────────
User-agent: *
Allow: /

# ────────────────────────────────────────────────────────────────────
# Major search engines — explicit allow
# ────────────────────────────────────────────────────────────────────
User-agent: Googlebot
Allow: /

User-agent: Googlebot-Image
Allow: /

User-agent: Bingbot
Allow: /

User-agent: DuckDuckBot
Allow: /

User-agent: Applebot
Allow: /

# ────────────────────────────────────────────────────────────────────
# AI retrieval crawlers — explicit allow.
# These are the user-agents most likely to surface citations and
# answer-engine references back to omegacentauri.me. We opt IN.
#
# Note: GPTBot, OAI-SearchBot, and ChatGPT-User are three distinct
# user-agents from OpenAI (training, live search, in-chat fetch).
# Anthropic publishes a similar split: ClaudeBot (training),
# Claude-SearchBot (search indexing), and Claude-User (user-initiated
# fetch). Claude-Web and anthropic-ai are older tokens, kept here for
# compatibility with crawlers that may still announce them.
# ────────────────────────────────────────────────────────────────────
User-agent: GPTBot
Allow: /

User-agent: OAI-SearchBot
Allow: /

User-agent: ChatGPT-User
Allow: /

User-agent: ClaudeBot
Allow: /

User-agent: Claude-SearchBot
Allow: /

User-agent: Claude-User
Allow: /

User-agent: Claude-Web
Allow: /

User-agent: anthropic-ai
Allow: /

User-agent: PerplexityBot
Allow: /

User-agent: Perplexity-User
Allow: /

User-agent: Google-Extended
Allow: /

User-agent: Applebot-Extended
Allow: /

User-agent: Meta-ExternalAgent
Allow: /

User-agent: Meta-ExternalFetcher
Allow: /

User-agent: Bytespider
Allow: /

User-agent: CCBot
Allow: /

User-agent: cohere-ai
Allow: /

User-agent: Diffbot
Allow: /

User-agent: YouBot
Allow: /

User-agent: Amazonbot
Allow: /

# ────────────────────────────────────────────────────────────────────
# Noisy SEO / competitive-intelligence scrapers — disallow.
# These produce no inbound visibility benefit; they only enumerate
# the site for third-party SEO dashboards.
# ────────────────────────────────────────────────────────────────────
User-agent: AhrefsBot
Disallow: /

User-agent: SemrushBot
Disallow: /

User-agent: MJ12bot
Disallow: /

User-agent: DotBot
Disallow: /

User-agent: BLEXBot
Disallow: /

User-agent: PetalBot
Disallow: /

# ────────────────────────────────────────────────────────────────────
# Sitemap
# ────────────────────────────────────────────────────────────────────
Sitemap: https://omegacentauri.me/sitemap.xml