diff --git a/CLAUDE.md b/CLAUDE.md index f256938..d77b57b 100644 --- a/CLAUDE.md +++ b/CLAUDE.md @@ -213,6 +213,8 @@ CHANGE_LOG: - "STRUCTURE: aktive vs. legacy CSS/JS getrennt, videos/, downloads/, insights/, accountforger-video.html, weitere Top-Level-Files ergänzt" - "Lagen-Layout: cyberangriffe und deepfakes binden Lagebild-CSS/JS aus iran-konflikt ein (zentrale Assets)" - "SERVICES: sync-lagebild und insights ergänzt" + - "SEO Stufe 1: noindex/nofollow von 12 indexierbaren Seiten entfernt; robots.txt scharf geschaltet (Live-Search-AI-Bots erlaubt, Training-Bots geblockt); sitemap.xml deployt" + - "Lagen-Seiten: description, canonical, Open Graph, Twitter Card, Schema.org Article ergänzt; Topic-Default in #incident-title als Crawler-Fallback" Last-Updated: 2026-05-10 diff --git a/datenschutz.html b/datenschutz.html index 3393f20..6601ba6 100644 --- a/datenschutz.html +++ b/datenschutz.html @@ -6,7 +6,6 @@ Datenschutz – AegisSight - diff --git a/en/index.html b/en/index.html index e431aa6..5aa2633 100644 --- a/en/index.html +++ b/en/index.html @@ -5,7 +5,6 @@ AegisSight Monitor – Real-time situation reports from open sources - diff --git a/en/legal-notice.html b/en/legal-notice.html index e9e6034..775a4c7 100644 --- a/en/legal-notice.html +++ b/en/legal-notice.html @@ -6,7 +6,6 @@ Legal notice – AegisSight - diff --git a/en/privacy.html b/en/privacy.html index b950f47..5b8ab37 100644 --- a/en/privacy.html +++ b/en/privacy.html @@ -6,7 +6,6 @@ Privacy policy – AegisSight - diff --git a/en/situations/cyber-attacks/index.html b/en/situations/cyber-attacks/index.html index 37ea87b..f900945 100644 --- a/en/situations/cyber-attacks/index.html +++ b/en/situations/cyber-attacks/index.html @@ -4,10 +4,64 @@ Situation report: Cyberattacks on German infrastructure - AegisSight - + + + + + + + + + + + + + + + + + + + + + + + + + @@ -67,7 +121,7 @@

SITUATION REPORT

-

+

Cyberattacks on German Infrastructure

diff --git a/en/situations/deepfakes/index.html b/en/situations/deepfakes/index.html index d8c140b..97f5c2e 100644 --- a/en/situations/deepfakes/index.html +++ b/en/situations/deepfakes/index.html @@ -4,10 +4,64 @@ Research: Legal status of deepfakes in Germany - AegisSight - + + + + + + + + + + + + + + + + + + + + + + + + + @@ -74,7 +128,7 @@

RESEARCH BRIEFING

-

+

Legal Status of Deepfakes in Germany

diff --git a/en/situations/iran-conflict/index.html b/en/situations/iran-conflict/index.html index 36e6b55..9f23875 100644 --- a/en/situations/iran-conflict/index.html +++ b/en/situations/iran-conflict/index.html @@ -4,10 +4,64 @@ Situation report: Iran conflict - AegisSight - + + + + + + + + + + + + + + + + + + + + + + + + + @@ -74,7 +128,7 @@

SITUATION REPORT

-

+

Iran Conflict

diff --git a/impressum.html b/impressum.html index 9a94deb..4759e31 100644 --- a/impressum.html +++ b/impressum.html @@ -6,7 +6,6 @@ Impressum – AegisSight - diff --git a/index.html b/index.html index 0eeb7ae..fee50f7 100644 --- a/index.html +++ b/index.html @@ -5,7 +5,6 @@ AegisSight Monitor – Echtzeit-Lagebilder aus offenen Quellen - diff --git a/lagen/cyberangriffe/index.html b/lagen/cyberangriffe/index.html index a0ec6ad..d37daa9 100644 --- a/lagen/cyberangriffe/index.html +++ b/lagen/cyberangriffe/index.html @@ -4,10 +4,64 @@ Lagebild: Cyberangriffe auf deutsche Infrastruktur - AegisSight - + + + + + + + + + + + + + + + + + + + + + + + + + @@ -66,7 +120,7 @@

LAGEBILD

-

+

Cyberangriffe auf deutsche Infrastruktur

diff --git a/lagen/deepfakes/index.html b/lagen/deepfakes/index.html index 33959f2..a92f2a0 100644 --- a/lagen/deepfakes/index.html +++ b/lagen/deepfakes/index.html @@ -4,10 +4,64 @@ Recherche: Rechtliche Lage von Deepfakes in Deutschland - AegisSight - + + + + + + + + + + + + + + + + + + + + + + + + + @@ -73,7 +127,7 @@

RECHERCHE

-

+

Rechtliche Lage von Deepfakes in Deutschland

diff --git a/lagen/iran-konflikt/index.html b/lagen/iran-konflikt/index.html index 3f632e3..2562307 100644 --- a/lagen/iran-konflikt/index.html +++ b/lagen/iran-konflikt/index.html @@ -4,10 +4,64 @@ Lagebild Irankonflikt - AegisSight - + + + + + + + + + + + + + + + + + + + + + + + + + @@ -73,7 +127,7 @@

LAGEBILD

-

+

Iran-Konflikt

diff --git a/robots.txt b/robots.txt index ca4047a..6807159 100644 --- a/robots.txt +++ b/robots.txt @@ -1,94 +1,23 @@ -# robots.txt for AegisSight UG -# Block ALL web crawlers and bots from the entire site +# robots.txt - AegisSight UG +# Crawling allgemein erlaubt, ausser API/interne Pfade +# Keine Trainingsdaten-Verwendung durch AI-Crawler (Training-Bots geblockt) +# Live-Search-AI-Bots (OAI-SearchBot, ChatGPT-User, Claude-SearchBot, Claude-User, PerplexityBot) sind erlaubt -# Block all bots User-agent: * -Disallow: / -Crawl-delay: 86400 +Allow: / +Disallow: /api/ +Disallow: /_archiv/ +Disallow: /insights/ -# Specifically block major search engines -User-agent: Googlebot -Disallow: / +# Sitemap +Sitemap: https://aegis-sight.de/sitemap.xml -User-agent: Bingbot -Disallow: / - -User-agent: Slurp -Disallow: / - -User-agent: DuckDuckBot -Disallow: / - -User-agent: Baiduspider -Disallow: / - -User-agent: YandexBot -Disallow: / - -# Block social media crawlers -User-agent: facebookexternalhit -Disallow: / - -User-agent: Twitterbot -Disallow: / - -User-agent: LinkedInBot -Disallow: / - -User-agent: WhatsApp -Disallow: / - -User-agent: TelegramBot -Disallow: / - -# Block SEO and analysis bots -User-agent: AhrefsBot -Disallow: / - -User-agent: SemrushBot -Disallow: / - -User-agent: DotBot -Disallow: / - -User-agent: MJ12bot -Disallow: / - -User-agent: SEOkicks-Robot -Disallow: / - -User-agent: SeznamBot -Disallow: / - -User-agent: MauiBot -Disallow: / - -User-agent: Majestic-12 -Disallow: / - -User-agent: Majestic-SEO -Disallow: / - -# Block archiving bots -User-agent: ia_archiver -Disallow: / - -User-agent: Wayback Machine -Disallow: / - -User-agent: SiteSnagger -Disallow: / - -User-agent: WebCopier -Disallow: / - -# Block AI/ML crawlers +# ---------------------------------------------------------------------- +# AI-Training-Crawler -- BLOCKED (kein Training auf unseren Inhalten) +# ---------------------------------------------------------------------- User-agent: GPTBot Disallow: / 
-User-agent: ChatGPT-User -Disallow: / - User-agent: CCBot Disallow: / @@ -98,15 +27,86 @@ Disallow: / User-agent: Claude-Web Disallow: / -# Block download managers -User-agent: wget +User-agent: Google-Extended Disallow: / -User-agent: curl +User-agent: Applebot-Extended Disallow: / +User-agent: Meta-ExternalAgent +Disallow: / + +User-agent: Bytespider +Disallow: / + +User-agent: cohere-ai +Disallow: / + +User-agent: FacebookBot +Disallow: / + +User-agent: ImagesiftBot +Disallow: / + +User-agent: Diffbot +Disallow: / + +User-agent: Omgilibot +Disallow: / + +# ---------------------------------------------------------------------- +# AI-Live-Search-Crawler -- ALLOWED (Sichtbarkeit in KI-Antworten) +# OAI-SearchBot, ChatGPT-User, Claude-SearchBot, Claude-User, PerplexityBot werden NICHT +# blockiert. Sie crawlen fuer Live-Antworten, nicht fuer Training. +# ---------------------------------------------------------------------- + +# ---------------------------------------------------------------------- +# Archiv-Bots +# ---------------------------------------------------------------------- +User-agent: ia_archiver +Disallow: / + +User-agent: archive.org_bot +Disallow: / + +# ---------------------------------------------------------------------- +# SEO-/Spam-Crawler +# ---------------------------------------------------------------------- +User-agent: AhrefsBot +Disallow: / + +User-agent: SemrushBot +Disallow: / + +User-agent: MJ12bot +Disallow: / + +User-agent: DotBot +Disallow: / + +User-agent: SEOkicks-Robot +Disallow: / + +User-agent: MauiBot +Disallow: / + +User-agent: Majestic-12 +Disallow: / + +User-agent: BLEXBot +Disallow: / + +User-agent: SerendeputyBot +Disallow: / + +# ---------------------------------------------------------------------- +# Download-Manager +# ---------------------------------------------------------------------- User-agent: HTTrack Disallow: / -# No sitemap provided -# No crawl permissions granted \ No newline at end of file +User-agent: SiteSnagger 
+Disallow: / + +User-agent: WebCopier +Disallow: / diff --git a/sitemap.xml b/sitemap.xml new file mode 100644 index 0000000..9183821 --- /dev/null +++ b/sitemap.xml @@ -0,0 +1,100 @@ + + + + https://aegis-sight.de/ + weekly + 1.0 + + + + + + https://aegis-sight.de/en/ + weekly + 1.0 + + + + + + https://aegis-sight.de/lagen/iran-konflikt/ + daily + 0.8 + + + + + + https://aegis-sight.de/en/situations/iran-conflict/ + daily + 0.8 + + + + + + https://aegis-sight.de/lagen/cyberangriffe/ + daily + 0.8 + + + + + + https://aegis-sight.de/en/situations/cyber-attacks/ + daily + 0.8 + + + + + + https://aegis-sight.de/lagen/deepfakes/ + weekly + 0.7 + + + + + + https://aegis-sight.de/en/situations/deepfakes/ + weekly + 0.7 + + + + + + https://aegis-sight.de/impressum.html + yearly + 0.3 + + + + + + https://aegis-sight.de/en/legal-notice.html + yearly + 0.3 + + + + + + https://aegis-sight.de/datenschutz.html + yearly + 0.3 + + + + + + https://aegis-sight.de/en/privacy.html + yearly + 0.3 + + + + +