# robots.txt for https://www.himanshurawat.in
#
# Parsing rules this file relies on (RFC 9309):
#   - One directive per line; "#" starts a comment that runs to end of line.
#   - A crawler obeys ONLY the most specific User-agent group that names it.
#     Rules from the "*" group are NOT inherited by a named group, so every
#     group below carries the full Disallow list itself.
#   - Within a group the longest matching path wins; on a tie, Allow wins.
#   - Path patterns start with "/"; "*" is a wildcard.

# ---------------------------------------------------------------------------
# Default group: applies to every crawler that has no group of its own.
# Googlebot, LinkedInBot and FacebookExternalHit intentionally have no
# separate group: they need nothing beyond this policy, and a separate
# Allow-only group would make them skip every Disallow rule below.
# ---------------------------------------------------------------------------
User-agent: *
Allow: /

# Crawl delay in seconds. Ignored by crawlers that do not support the
# directive (Googlebot among them).
Crawl-delay: 1

# Per-extension Allow rules (css, js, images, video, pdf, ...) are deliberately
# omitted: "Allow: /" already permits every file type, and under longest-match
# precedence a pattern such as "/*.js" would override shorter Disallow rules
# like "/src/" and expose the protected directories.

# SEO-friendly pages
Allow: /about
Allow: /projects
Allow: /projects/*
Allow: /contact
Allow: /articles
Allow: /articles/*

# Blog and article-specific entries
Allow: /articles/modi-social-media-independence-day-2025
Allow: /articles/react-development-2025
Allow: /articles?topic=*

# RSS feed (if implemented in future)
Allow: /feed.xml
Allow: /rss.xml

# Public assets
Allow: /public/
Allow: /assets/

# Important metadata
Allow: /manifest.json
Allow: /robots.txt
Allow: /sitemap.xml
Allow: /sitemap.html

# Development/build files and sensitive directories
Disallow: /build/
Disallow: /dist/
Disallow: /src/
Disallow: /src/assets/
Disallow: /src/components/
Disallow: /src/pages/
Disallow: /src/data/
Disallow: /node_modules/
Disallow: /.git/
Disallow: /.env
Disallow: /config/
Disallow: /temp/
Disallow: /cache/
Disallow: /admin/
Disallow: /test/
Disallow: /tests/
Disallow: /scripts/
Disallow: /docs/
Disallow: /backups/
Disallow: /*.log

# ---------------------------------------------------------------------------
# Bingbot: same policy as the default group, with a longer crawl delay.
# Because named groups do not inherit from "*", the Disallow list is repeated
# here; keep it in sync with the default group.
# ---------------------------------------------------------------------------
User-agent: Bingbot
Allow: /
Crawl-delay: 2
Disallow: /build/
Disallow: /dist/
Disallow: /src/
Disallow: /src/assets/
Disallow: /src/components/
Disallow: /src/pages/
Disallow: /src/data/
Disallow: /node_modules/
Disallow: /.git/
Disallow: /.env
Disallow: /config/
Disallow: /temp/
Disallow: /cache/
Disallow: /admin/
Disallow: /test/
Disallow: /tests/
Disallow: /scripts/
Disallow: /docs/
Disallow: /backups/
Disallow: /*.log

# ---------------------------------------------------------------------------
# Sitemap locations (group-independent; apply to all crawlers).
# Note: add hreflang variations when multi-language support is implemented.
# NOTE(review): the Sitemap directive expects an XML, RSS/Atom or plain-text
# sitemap. If /sitemap.html is a human-readable HTML page, crawlers will
# likely reject it as a sitemap; confirm and remove that line if so.
# ---------------------------------------------------------------------------
Sitemap: https://www.himanshurawat.in/sitemap.xml
Sitemap: https://www.himanshurawat.in/sitemap.html