# Robots.txt for heijmerikx.com
#
# NOTE: robots.txt is line-oriented. Every directive must sit on its own line,
# and "#" comments out the remainder of the line it appears on.

# ---------------------------------------------------------------------------
# Default rules for every crawler that has no dedicated group below.
# ---------------------------------------------------------------------------
User-agent: *
Allow: /

# Block admin and authentication paths
Disallow: /mng/
Disallow: /login
Disallow: /api/

# Block client portal (private galleries)
Disallow: /client/

# ---------------------------------------------------------------------------
# AI training crawlers — disallowed entirely.
# Photographs and editorial content on this site are not licensed for use as
# training data for generative AI models. Citation/search crawlers (Googlebot,
# Bingbot, PerplexityBot, ChatGPT-User, OAI-SearchBot, Applebot, etc.) are NOT
# listed here and fall under the "User-agent: *" group above, so they are
# free to crawl and cite the site.
#
# A crawler obeys only the most specific group that matches its user-agent,
# so each group below fully replaces the "*" rules for that crawler;
# "Disallow: /" already covers every path.
# ---------------------------------------------------------------------------
User-agent: GPTBot
Disallow: /

User-agent: Google-Extended
Disallow: /

User-agent: anthropic-ai
Disallow: /

User-agent: ClaudeBot
Disallow: /

User-agent: Claude-Web
Disallow: /

User-agent: cohere-ai
Disallow: /

User-agent: cohere-training-data-crawler
Disallow: /

User-agent: CCBot
Disallow: /

User-agent: Applebot-Extended
Disallow: /

User-agent: FacebookBot
Disallow: /

User-agent: Meta-ExternalAgent
Disallow: /

User-agent: Bytespider
Disallow: /

User-agent: PetalBot
Disallow: /

User-agent: Diffbot
Disallow: /

User-agent: omgili
Disallow: /

User-agent: omgilibot
Disallow: /

User-agent: ImagesiftBot
Disallow: /

# Sitemap
Sitemap: https://heijmerikx.com/sitemap.xml