# Crawler access rules (robots.txt format).
# Format reminder: exactly one directive per line; "#" starts a comment that
# runs to the end of that line. Lone "#" lines are used as visual separators
# inside a group instead of blank lines, because some older parsers treat a
# blank line as the end of the group.

# === SITEMAP ===
Sitemap: https://www.naturagart.de/export/sitemap.xml

# === AI-CRITICAL RESOURCES (EXPLICIT ALLOWS) ===
# Default group: applies to every crawler that has no dedicated group below.
User-agent: *
Allow: /llms.txt
Allow: /llms-full.txt
Allow: /.well-known/
Allow: /sitemap*.xml
Allow: /Infos/
Allow: /Teiche/
Allow: /Teichtechnik/
Allow: /Pflanzen/
Allow: /Videos/
Allow: /Naturnah-wohnen/
Allow: /NaturaGart-Park/
Allow: /Tauchpark/
#
# === STANDARD DISALLOWS ===
Disallow: /admin/
Disallow: /Core/
Disallow: /tmp/
Disallow: /views/
Disallow: /Setup/
Disallow: /log/
#
Disallow: /newsletter/
Disallow: /en/newsletter/
Disallow: /index.php?cl=newsletter
#
Disallow: /agb/
Disallow: /en/terms/
#
Disallow: /warenkorb/
Disallow: /en/cart/
Disallow: /index.php?cl=basket
#
Disallow: /mein-konto/
Disallow: /en/my-account/
Disallow: /index.php?cl=account
#
Disallow: /mein-merkzettel/
Disallow: /en/my-wishlist/
Disallow: /index.php?cl=account_noticelist
#
Disallow: /mein-wunschzettel/
Disallow: /en/my-gift-registry/
Disallow: /index.php?cl=account_wishlist
#
Disallow: /konto-eroeffnen/
Disallow: /en/open-account/
Disallow: /index.php?cl=register
#
Disallow: /passwort-vergessen/
Disallow: /en/forgot-password/
Disallow: /index.php?cl=forgotpwd
#
Disallow: /index.php?cl=moredetails
#
Disallow: /index.php?cl=review
#
Disallow: /index.php?cl=search
#
Disallow: /EXCEPTION_LOG.txt
#
# Wildcard rules are kept at the end because some crawlers report them as errors.
Disallow: /*?cl=newsletter
Disallow: /*&cl=newsletter
#
Disallow: /*?cl=basket
Disallow: /*&cl=basket
#
Disallow: /*?cl=account
Disallow: /*&cl=account
#
Disallow: /*?cl=account_noticelist
Disallow: /*&cl=account_noticelist
#
Disallow: /*?cl=account_wishlist
Disallow: /*&cl=account_wishlist
#
Disallow: /*?cl=register
Disallow: /*&cl=register
#
Disallow: /*?cl=forgotpwd
Disallow: /*&cl=forgotpwd
#
Disallow: /*?cl=moredetails
Disallow: /*&cl=moredetails
#
Disallow: /*?cl=review
Disallow: /*&cl=review
#
Disallow: /*?cl=search
Disallow: /*&cl=search
#
Disallow: /*&fnc=tobasket
Disallow: /*&fnc=tocomparelist
Disallow: /*&addcompare=
#
Disallow: /*/sid/
Disallow: /*?sid=
Disallow: /*&sid=
#
# NOTE(review): "/*&cur" has no trailing "=" unlike "/*?cur="; kept exactly as
# found (it matches a superset of "&cur=") - confirm whether this is intended.
Disallow: /*?cur=
Disallow: /*&cur
#
Disallow: /*force_sid=*
Disallow: /*ldtype=*
Disallow: /*_artperpage=*
Disallow: /*listorderby=*
Disallow: /*listorder=*
Disallow: /*newsletter=*

# ---------------------------------------------------------------------------
# Dedicated groups for AI crawlers.
# A crawler that matches one of the named groups below uses ONLY that group;
# the "User-agent: *" rules above (including every Disallow) do not apply to it.
# NOTE(review): with "Allow: /" these bots may therefore fetch /admin/, basket,
# account and session-id URLs - confirm this is intended, or repeat the
# Disallow rules inside each group.
# "Crawl-delay" is a non-standard directive (not part of RFC 9309); crawlers
# are free to ignore it.
# ---------------------------------------------------------------------------

# === OPENAI (ChatGPT, GPT-4, ChatGPT Search) ===
User-agent: GPTBot
Allow: /
Allow: /llms.txt
Crawl-delay: 1

User-agent: ChatGPT-User
Allow: /
Allow: /llms.txt
Crawl-delay: 1

# === GOOGLE AI (Gemini) ===
User-agent: Google-Extended
Allow: /
Allow: /llms.txt
Crawl-delay: 1

# === ANTHROPIC (Claude) ===
User-agent: Claude-Web
Allow: /
Allow: /llms.txt
Crawl-delay: 1

User-agent: anthropic-ai
Allow: /
Allow: /llms.txt
Crawl-delay: 1

# === PERPLEXITY ===
User-agent: PerplexityBot
Allow: /
Allow: /llms.txt
Crawl-delay: 1

# === COMMON CRAWL (AI Training Data) ===
User-agent: CCBot
Allow: /
Allow: /llms.txt
Crawl-delay: 2

# === OTHER AI CRAWLERS ===
User-agent: cohere-ai
Allow: /
Allow: /llms.txt

User-agent: Omgilibot
Allow: /
Allow: /llms.txt

User-agent: Applebot-Extended
Allow: /
Allow: /llms.txt

User-agent: facebookexternalhit
Allow: /
Allow: /llms.txt