# robots.txt for https://ofallonvets.com
#
# Reading notes for maintainers:
#   * The format is line-oriented: exactly one directive per line.
#   * A crawler obeys ONLY the single group whose User-agent line matches it
#     most specifically; it does not also inherit the "*" group. Any crawler
#     that gets its own group must therefore carry the private-area rules
#     itself. To guarantee that, every welcomed crawler is listed in the same
#     group as "*" below, so they all share one rule set.
#   * Do not insert blank lines inside a group; some parsers treat a blank
#     line as the end of the group. Comment lines are safe.
#   * Crawl-delay is intentionally not used: it is not part of the Robots
#     Exclusion Protocol standard, Google ignores it, and the previous value
#     of 0 requested no delay anyway.

# ---------------------------------------------------------------------------
# Group 1: welcomed crawlers and the default policy.
# Everything is crawlable except the private/utility paths listed below.
# ---------------------------------------------------------------------------
# Default for any crawler not named elsewhere in this file
User-agent: *
# Major search engines
User-agent: Googlebot
User-agent: Bingbot
User-agent: Slurp
User-agent: DuckDuckBot
User-agent: YandexBot
User-agent: Baiduspider
# AI crawlers for LLMO (Large Language Model Optimization)
User-agent: GPTBot
User-agent: Google-Extended
User-agent: CCBot
User-agent: ChatGPT-User
User-agent: Claude-Web
User-agent: ClaudeBot
User-agent: anthropic-ai
User-agent: PerplexityBot
User-agent: YouBot
User-agent: Meta-ExternalAgent
# Social media crawlers for better social sharing
User-agent: facebookexternalhit
User-agent: Twitterbot
User-agent: LinkedInBot
User-agent: WhatsApp
User-agent: TelegramBot
# Local business and review crawlers
User-agent: AppleBot
# Academic and research crawlers
User-agent: ia_archiver
# Private areas and unwanted content scraping
Disallow: /admin/
Disallow: /private/
Disallow: /wp-admin/
Disallow: /cgi-bin/
Disallow: /*.json$
# Print/debug URL variants, whether the parameter is first (?) or later (&)
Disallow: /*?print=
Disallow: /*&print=
Disallow: /*?debug=
Disallow: /*&debug=
# Kept last on purpose: longest-match parsers are unaffected by order, while
# first-match parsers would otherwise stop here and ignore the Disallow rules.
Allow: /

# ---------------------------------------------------------------------------
# Group 2: aggressive SEO crawlers, blocked entirely to reduce server load.
# ---------------------------------------------------------------------------
User-agent: AhrefsBot
User-agent: SemrushBot
User-agent: MJ12bot
User-agent: DotBot
User-agent: BLEXBot
User-agent: DataForSeoBot
User-agent: PetalBot
User-agent: SentiBot
User-agent: MegaIndex
User-agent: LinkpadBot
Disallow: /

# ---------------------------------------------------------------------------
# Sitemap locations (add additional sitemaps as you create them).
# Sitemap lines are independent of the groups above and apply to all crawlers.
# ---------------------------------------------------------------------------
Sitemap: https://ofallonvets.com/sitemap.xml