# ==============================
# Full access for QualifiedBot
# ==============================
# Kept as its own group, ahead of the generic group. Rules attach to the
# most recent User-agent line, so this group must not be placed in the
# middle of the "User-agent: *" rules: doing so would hand every Disallow
# that follows to QualifiedBot and leave all other crawlers unrestricted.
User-agent: QualifiedBot
Allow: /

# ==============================
# Rules for all other crawlers
# ==============================
User-agent: *
# Crawl-delay is not part of the Robots Exclusion Protocol standard;
# crawlers that do not recognise it ignore this line.
Crawl-delay: 10

# ------------------------------------
# 2.1 Default behavior
# ------------------------------------
# By default, all public pages are allowed.
Allow: /

# ------------------------------------
# 2.2 System / admin / user pages
# ------------------------------------
Disallow: /admin/
Disallow: /comment/
Disallow: /comment/reply/
Disallow: /user/register
Disallow: /user/password
Disallow: /user/login
Disallow: /user/logout
Disallow: /search/*
Disallow: /search/node/

# If your site uses "node" or "taxonomy" URLs publicly,
# review these rules before keeping them.
# Patterns start with "/" as the robots.txt path grammar requires. Each
# pair below matches the same URLs as the former "*/node/*" and
# "*/taxonomy/*" rules (any URL containing "/node/" or "/taxonomy/").
Disallow: /node/
Disallow: /*/node/
Disallow: /taxonomy/
Disallow: /*/taxonomy/
Disallow: /pr-category/

# Custom internal sections (review if they contain SEO content)
Disallow: /business-need/
Disallow: /users/
Disallow: /eskcluser/
Disallow: /sites/default/files/styles/

# ------------------------------------
# 2.3 Technical / maintenance scripts
# ------------------------------------
Disallow: /cron.php
Disallow: /install.php
Disallow: /update.php
Disallow: /xmlrpc.php

# Legacy / documentation / changelogs
Disallow: /README.md
Disallow: /CHANGELOG.txt
Disallow: /INSTALL.txt
Disallow: /INSTALL.mysql.txt
Disallow: /INSTALL.pgsql.txt
Disallow: /INSTALL.sqlite.txt
Disallow: /LICENSE.txt
Disallow: /MAINTAINERS.txt
Disallow: /UPGRADE.txt
Disallow: /modules/README.txt
Disallow: /sites/README.txt
Disallow: /themes/README.txt
Disallow: /web.config

# Old RSS endpoints (if not used anymore)
Disallow: /rss.asp
Disallow: /rss.xml

# ------------------------------------
# 2.4 Legacy / no-clean URLs
# ------------------------------------
Disallow: /index.php/admin/
Disallow: /index.php/comment/reply/
Disallow: /index.php/filter/tips
Disallow: /index.php/node/add/
Disallow: /index.php/search/
Disallow: /index.php/user/password
Disallow: /index.php/user/register
Disallow: /index.php/user/login
Disallow: /index.php/user/logout
Disallow: /index.php/media/oembed
Disallow: /index.php/*/media/oembed
Disallow: /?q=admin/
Disallow: /?q=comment/reply/
Disallow: /?q=filter/tips/
Disallow: /?q=node/add/
Disallow: /?q=search/
Disallow: /?q=user/password/
Disallow: /?q=user/register/
Disallow: /?q=user/login/
Disallow: /?q=user/logout/
Disallow: /?q=taxonomy/

# ------------------------------------
# 2.5 URL parameters / filters / tracking
# These rules help reduce duplicate content caused by query parameters.
# ------------------------------------
# NOTE: every pattern below has a literal "?" directly before the parameter
# name, so it only matches when that parameter is the FIRST one in the query
# string (e.g. "/x?utm_source=a" matches, "/x?id=1&utm_source=a" does not).
# Add a matching "/*&name" rule if later positions must be blocked too.

# Generic search parameter
Disallow: /*?search=

# Common content filters / faceted navigation
Disallow: /*?title*
Disallow: /*?page*
Disallow: /*?resource_type*
Disallow: /resources/*?resource_type*
Disallow: /*?nid_entityreference_filter*
Disallow: /*?field_pr_category_tid*
Disallow: /*?field_tab_label_value*
Disallow: /*?field_team_category_tid*
Disallow: /*?field_business_need_tid*
Disallow: /*?field_job_*
Disallow: /*?field_field_*

# Tracking / campaign parameters
Disallow: /*?utm_

# Example kept from older config:
# Disallow: /*?utm_source*