# robots.txt for Cresco Landing Page
# https://cresco.example.com/robots.txt
#
# Format reminder: the Robots Exclusion Protocol is line-based. Every
# directive must sit on its own line; anything after a "#" on a line is a
# comment and is ignored by crawlers.

# ---------------------------------------------------------------------------
# General rules for all crawlers that have no dedicated group below
# ---------------------------------------------------------------------------
User-agent: *
Allow: /
Disallow: /api/
Disallow: /_astro/
# Crawl-delay is a non-standard extension; crawlers that do not support it
# simply ignore the line.
Crawl-delay: 1

# Sitemap location (applies globally, independent of any User-agent group)
Sitemap: https://cresco.example.com/sitemap.xml

# ---------------------------------------------------------------------------
# NOTE(review): a crawler obeys only the most specific User-agent group that
# matches it. Every bot named below therefore does NOT inherit the
# "Disallow: /api/" and "Disallow: /_astro/" rules from the "*" group above.
# If a named bot should stay out of those paths, repeat the Disallow lines
# inside its own group.
# ---------------------------------------------------------------------------

# ---------------------------------------------------------------------------
# AI crawlers - explicitly allow all content
# ---------------------------------------------------------------------------

# OpenAI GPT crawler
User-agent: GPTBot
Allow: /
Crawl-delay: 1

# ChatGPT user agent
User-agent: ChatGPT-User
Allow: /

# Anthropic Claude crawler
User-agent: Claude-Web
Allow: /
Crawl-delay: 1

# Google AI (Bard/Gemini)
User-agent: Google-Extended
Allow: /

# Common Crawl (used by many AI models)
User-agent: CCBot
Allow: /

# Meta AI
User-agent: FacebookBot
Allow: /

# Perplexity AI
User-agent: PerplexityBot
Allow: /

# Anthropic specific
User-agent: Anthropic-AI
Allow: /

# Additional AI/ML crawlers
User-agent: Applebot-Extended
Allow: /

User-agent: Diffbot
Allow: /

User-agent: omgili
Allow: /

# ---------------------------------------------------------------------------
# SEO and analytics bots
# ---------------------------------------------------------------------------

User-agent: Googlebot
Allow: /
Crawl-delay: 1

User-agent: Googlebot-Image
Allow: /

User-agent: Googlebot-Mobile
Allow: /

# Bing (search and Bing AI) - declared once; a second identical group for
# the same user agent adds nothing.
User-agent: Bingbot
Allow: /

User-agent: Slurp
Allow: /

User-agent: DuckDuckBot
Allow: /

User-agent: Baiduspider
Allow: /

User-agent: YandexBot
Allow: /

User-agent: Sogou
Allow: /

User-agent: Exabot
Allow: /

# ---------------------------------------------------------------------------
# Block known bad bots
# ---------------------------------------------------------------------------

User-agent: AhrefsBot
Disallow: /

User-agent: SemrushBot
Disallow: /

User-agent: MJ12bot
Disallow: /

User-agent: dotbot
Disallow: /