# robots.txt for GetDKAN.org — a Drupal distro walks into a website...
#
# Format notes for maintainers:
#   - One directive per line. A "#" starts a comment that runs to the end of
#     the line, so directives must never share a line with a leading "#".
#   - Allow/Disallow rules belong to the User-agent group directly above them.
#     Keep every rule inside its group; do not leave rules floating after an
#     unrelated group or after the Sitemap line.
#   - A crawler obeys only the most specific group that matches its name, so
#     the named groups below replace (not extend) the "*" group for those bots.

##############################################
# User Agents
##############################################

# --- General Access ---
# Hello bots, welcome to the land of open data. Please don't DoS the Views.
User-agent: *
# Web files: keep crawlers out of code and private file directories.
# Just pretend this is a full Drupal site. We're distro-pilled.
Disallow: /core/
Disallow: /vendor/
Disallow: /profiles/
Disallow: /sites/default/files/private/

# --- Specific Agents ---

# You're powerful. But stay out of the UI, command line hero.
User-agent: Drush
Disallow: /admin/

# Our features are already overridden. Don't make it worse.
User-agent: FeaturesBot
Disallow: /revert/

# This layout is held together by hopes and ctools. Proceed with caution.
User-agent: PanelsCrawler
Disallow: /layout-chaos/

# You already migrated it once. Let it rest.
User-agent: MigrateBot
Disallow: /old-dkan/

# You're a helpful spec, but some nodes are not for sharing.
User-agent: JSONAPI
Disallow: /private/

# Sorry HAL, no 2000s-era takeovers allowed.
User-agent: HALBot
Disallow: /human-override/

# This page never ends. Save your bandwidth.
User-agent: ViewsInfiniteScroll
Disallow: /bottomless/

##############################################
# Sitemaps
##############################################

# As generated by a very well-behaved cron(ish) job.
# Sitemap is independent of User-agent groups and must be an absolute URL.
Sitemap: https://getdkan.org/sitemap.xml

##############################################
# Final Reminders
##############################################

# Don't hack core. Seriously.
# For more information, see: https://www.drupal.org/docs/robots-txt
# Or just open an issue in the queue and hope someone responds. Classic.
# ❤️ With love, from the DKAN maintainers and all our yml config files.