# https://www.robotstxt.org/robotstxt.html
# This is for any additional robots directives
# Default policy for every crawler that has no dedicated group further down.
#
# A crawler obeys ONLY the single most specific group that matches its
# user-agent, so every rule meant for "everyone" must live in this one group.
# Googlebot, Bingbot and Slurp deliberately have no group of their own: a
# group holding just "Allow: /" would exempt them from all Disallow rules here.
#
# Do not put blank lines inside a group (some parsers treat them as the end of
# the group). Specific rules come before the catch-all "Allow: /" so that
# first-match parsers and longest-match parsers reach the same decision.
User-agent: *
# Next.js serves the site's CSS/JS bundles from /_next/static/; keep them
# crawlable so pages render correctly. This path is longer than "/_next/",
# so it wins under longest-match, and it is listed first for first-match.
Allow: /_next/static/
# Block access to development and system files
Disallow: /api/
Disallow: /_next/
Disallow: /out/
Disallow: /.next/
Disallow: /node_modules/
Disallow: /admin/
Disallow: /private/
# Block tracking-parameter variants of real pages (duplicate content)
Disallow: /*?*utm_*
Disallow: /*?*fbclid*
Disallow: /*?*gclid*
Disallow: /*?*ref=*
Disallow: /*?*source=*
# Allow important assets for SEO
Allow: /logo.webp
Allow: /doctors/
Allow: /building/
Allow: /*.css
Allow: /*.js
Allow: /*.webp
Allow: /*.jpg
Allow: /*.png
Allow: /*.svg
Allow: /manifest.json
Allow: /favicon.ico
# Everything not matched above may be crawled
Allow: /
# Crawl-delay for server health, in seconds. Non-standard: honored by Bing
# and Yahoo (Slurp), ignored by Googlebot.
Crawl-delay: 1

# Block problematic bots
User-agent: AhrefsBot
Disallow: /

User-agent: MJ12bot
Disallow: /

User-agent: DotBot
Disallow: /

# Medical website specific - block scraping bots
User-agent: ia_archiver
Disallow: /

User-agent: ScrapyBot
Disallow: /

# Sitemap location (single XML sitemap, given as an absolute URL).
# The Sitemap line is independent of the User-agent groups and applies to
# every crawler that reads this file.
Sitemap: https://eastgate.com.na/sitemap.xml
# No Host directive: it was a Yandex-only extension that Yandex retired in
# 2018, and no other crawler reads it. Canonicalize the preferred domain
# with 301 redirects and rel="canonical" links instead.
# Contact information for webmasters
# Contact: info@eastgate.com.na