De Telegraaf / robots.txt snapshot
← back to telegraaf.nl · fetched 2026-06-20T01:10:30Z (18h ago) · HTTP 200 · 2656 bytes · sha256 e12e0c1acebf9301 · raw
final URL: https://www.telegraaf.nl/robots.txt
| 1 | # Generated: 2026-06-18T09:55:50.306Z |
| 2 | # Brand: telegraaf.nl | Environment: prod |
| 3 | |
| 4 | # All copyrights, neighbouring rights and database rights in the content and layout of this website/app are explicitly reserved and are for personal, non-commercial use only. |
| 5 | # In accordance with Article 4 of the Directive on Copyright in the Digital Single Market (CDSM) and its transposition into the law of the applicable Member State, |
| 6 | # all content of this website, wherever it is made available, is not to be used for the purposes of text and data mining, extraction, scraping and/or the use of programs or robots |
| 7 | # for automatic data collection and/or extraction of digital data, whether for machine learning or artificial intelligence purposes or otherwise. |
| 8 | # See also the Terms and Conditions of this website. |
| 9 | |
| 10 | # robots.txt prod De Telegraaf |
| 11 | user-agent: * |
| 12 | Allow: / |
| 13 | Allow: /tags |
| 14 | |
| 15 | # Disallow Internal Search |
| 16 | Disallow: /zoeken/ |
| 17 | |
| 18 | # Disallow bundle |
| 19 | Disallow: /*?bundle |
| 20 | |
| 21 | # Disallow infront widgets |
| 22 | Disallow: /infront/widget/ |
| 23 | |
| 24 | # Disallow Sponsored Articles for Google News |
| 25 | User-agent: Googlebot-News |
| 26 | Disallow: /branded-content/ |
| 27 | Disallow: /brandedcontent/ |
| 28 | |
| 29 | # Disallow AI / Large Language Model crawlers and other third-party bots (SEO, archive, search, ads) |
| 30 | User-agent: Amazonbot |
| 31 | Disallow: / |
| 32 | |
| 33 | User-agent: anthropic-ai |
| 34 | Disallow: / |
| 35 | |
| 36 | User-agent: Bytespider |
| 37 | Disallow: / |
| 38 | |
| 39 | User-agent: CCBot |
| 40 | Disallow: / |
| 41 | |
| 42 | User-agent: ChatGPT-User |
| 43 | Disallow: / |
| 44 | |
| 45 | User-agent: ClaudeBot |
| 46 | Disallow: / |
| 47 | |
| 48 | User-agent: Claude-Web |
| 49 | Disallow: / |
| 50 | |
| 51 | User-agent: cohere-ai |
| 52 | Disallow: / |
| 53 | |
| 54 | User-agent: Diffbot |
| 55 | Disallow: / |
| 56 | |
| 57 | User-agent: FacebookBot |
| 58 | Disallow: / |
| 59 | |
| 60 | User-agent: Google-Extended |
| 61 | Disallow: / |
| 62 | |
| 63 | User-agent: GPTBot |
| 64 | Disallow: / |
| 65 | |
| 66 | User-agent: magpie-crawler |
| 67 | Disallow: / |
| 68 | |
| 69 | User-agent: omgili |
| 70 | Disallow: / |
| 71 | |
| 72 | User-agent: omgilibot |
| 73 | Disallow: / |
| 74 | |
| 75 | User-agent: PerplexityBot |
| 76 | Disallow: / |
| 77 | |
| 78 | User-agent: Google-CloudVertexBot |
| 79 | Disallow: / |
| 80 | |
| 81 | User-agent: meta-externalagent |
| 82 | Disallow: / |
| 83 | |
| 84 | User-agent: meta-externalfetcher |
| 85 | Disallow: / |
| 86 | |
| 87 | User-agent: Ahrefsbot |
| 88 | Disallow: / |
| 89 | |
| 90 | User-agent: Archive.org_bot |
| 91 | Disallow: / |
| 92 | |
| 93 | User-agent: Bravebot |
| 94 | Disallow: / |
| 95 | |
| 96 | User-agent: Claude-Searchbot |
| 97 | Disallow: / |
| 98 | |
| 99 | User-agent: Claude-User |
| 100 | Disallow: / |
| 101 | |
| 102 | User-agent: DeepSeekBot |
| 103 | Disallow: / |
| 104 | |
| 105 | User-agent: Meta-WebIndexer |
| 106 | Disallow: / |
| 107 | |
| 108 | User-agent: MistralAI-Index |
| 109 | Disallow: / |
| 110 | |
| 111 | User-agent: MistralAI-User |
| 112 | Disallow: / |
| 113 | |
| 114 | User-agent: OAI-AdsBot |
| 115 | Disallow: / |
| 116 | |
| 117 | User-agent: OAI-Searchbot |
| 118 | Disallow: / |
| 119 | |
| 120 | User-agent: Perplexity-User |
| 121 | Disallow: / |
| 122 | |
| 123 | User-agent: Youbot |
| 124 | Disallow: / |
| 125 | |
| 126 | # User-agent: Bingbot |
| 127 | # Disallow: / |
| 128 | |
| 129 | # List sitemaps |
| 130 | Sitemap: https://www.telegraaf.nl/sitemap.xml |
| 131 | Sitemap: https://www.telegraaf.nl/sitemap-image.xml |
| 132 | Sitemap: https://www.telegraaf.nl/sitemap-news.xml |
| 133 | Sitemap: https://www.telegraaf.nl/sitemap-video.xml |
| 134 | |
| 135 | # Served via new CDN |