# robots.txt for www.thueringer-allgemeine.de
#
# Layout: one record per line, groups separated by a blank line. Each group
# is a run of "User-agent:" lines followed by the rules that apply to them.

Sitemap: https://www.thueringer-allgemeine.de/sitemaps/news.xml

# Default policy for every crawler that is not named in a group further down.
# The three Allow rules carve specific assets out of the broader
# "Disallow: /static/*" rule below (the longer, more specific match wins).
User-agent: *
Allow: /static/*/client.js
Allow: /static/*/main.css
Allow: /static/*/favicon.png
Disallow: /stats/*
Disallow: /*?config*
Disallow: /*.xmli*
Disallow: /*?service=Ajax
Disallow: /*?service=ajax
Disallow: /config/*
Disallow: /test/*
Disallow: /Test/*
Disallow: /template/*
Disallow: /*?*token=*
Disallow: /*?*eventId=*
Disallow: /static/*
Disallow: /migration_import_no_section/*
Disallow: /secure/
Disallow: /socialmedia/*
# NOTE(review): "READER_ID" looks like an unsubstituted placeholder; as written
# this only matches URLs containing the literal text "reader_id=READER_ID".
# Confirm whether "/*reader_id=" was intended.
Disallow: /*reader_id=READER_ID*
Disallow: /suche/*
Disallow: /*?widgetid=
Disallow: /newsletter-result/
Disallow: /*tpcc=*
Disallow: /resources/
Disallow: /bin/
Disallow: /downloads/
Disallow: /service/newsletter-adconsent
Disallow: /pagespeed_static/
Disallow: /resources/img/*icon*pagespeed

# search engines
User-agent: Cliqzbot
User-agent: Baiduspider
User-agent: sogou spider
User-agent: Flamingo_SearchEngine
User-agent: SeznamBot
User-agent: Yandex
Disallow: /

# seo tools
User-agent: SemrushBot-SA
User-agent: AhrefsBot
User-agent: BacklinkCrawler
User-agent: LinkChecker
User-agent: DataForSeoBot
User-agent: deepcrawl
User-agent: Majestic
User-agent: Majestic12
User-agent: MJ12bot
User-agent: OnPageBot
User-agent: Optimizer
User-agent: RyteBot
User-agent: SemrushBot
User-agent: Semrushbot-SI
User-agent: Seobility
User-agent: SEOdiver
User-agent: SEOkicks
User-agent: SEOkicks-Robot
User-agent: sistrix
User-agent: OpenindexSpider
User-agent: openindexspider
User-agent: SISTRIX Optimizer
User-agent: SISTRIX
User-agent: SISTRIX Crawler
User-agent: SiteAuditBot
Disallow: /

# ai tools
User-agent: Amazonbot
User-agent: anthropic-ai
User-agent: Applebot-Extended
User-agent: archive.org_bot
User-agent: Bytespider
User-agent: CCBot
User-agent: ChatGPT-User
User-agent: ClaudeBot
User-agent: Claude-Web
User-agent: cohere-ai
User-agent: Diffbot
User-agent: FacebookBot
User-agent: FriendlyCrawler
User-agent: Google-Extended
User-agent: GoogleOther
User-agent: GPTBot
User-agent: ia_archiver
User-agent: img2dataset
User-agent: omgili
User-agent: omgilibot
User-agent: peer39_crawler
User-agent: peer39_crawler/1.0
User-agent: PerplexityBot
User-agent: YouBot
User-agent: meta-externalagent
User-agent: ImagesiftBot
Disallow: /

# other
# NOTE(review): the entry "User-agent: User-agent" below is kept from the
# original file; it may be a copy/paste slip rather than a real crawler
# token - confirm before removing.
User-agent: arquivo-web-crawler
User-agent: arquivo.pt
User-agent: Barkrowler
User-agent: BLEXBot
User-agent: browsertrix
User-agent: brozzler
User-agent: BuiltWith
User-agent: Cincraw
User-agent: coccocbot
User-agent: contao/crawler
User-agent: Dmbot
User-agent: DomainStatsBot
User-agent: DotBot
User-agent: dotbot
User-agent: fluid
User-agent: HaosouSpider
User-agent: HappyWing
User-agent: harsilbot
User-agent: hatena antenna
User-agent: Heritrix
User-agent: kazbtbot
User-agent: Kraken
User-agent: linkdebot
User-agent: Linkfluence Yak Bot
User-agent: mail.RU_Bot
User-agent: MetaJobBot
User-agent: Monsidobot
User-agent: netEstate
User-agent: OGDWCtcxCrawler
User-agent: PetalBot
User-agent: ResearchBot
User-agent: Riddler
User-agent: SentiBot
User-agent: rogerbot
User-agent: Semanticbot
User-agent: SemanticScholarBot
User-agent: SirdataBot
User-agent: spbot
User-agent: special_archiver
User-agent: SplitSignalBot
User-agent: Tag-Crawler
User-agent: Testcrawler
User-agent: thinkers-bot
User-agent: Toplistbot
User-agent: uipbot/1.0
User-agent: urlsuma
User-agent: User-agent
User-agent: VsuSearchSpider
User-agent: weborama-fetcher
User-agent: WiseGuys Robot
User-agent: wpbot
User-agent: Yeti
Disallow: /