NeuralCrawl

GlobalFoundries / robots.txt snapshot

← back to gf.com · fetched 2026-06-20T01:10:31Z (15h ago) · HTTP 200 · 2361 bytes · sha256 a1cbf7c00e1fe9c4 · raw

final URL: https://gf.com/robots.txt

1# robots.txt for gf.com
2# Last updated: June 2026
3# Sitemap: https://gf.com/sitemap_index.xml
4
5# -------------------------------------------------------
6# All crawlers (default rules)
7# -------------------------------------------------------
8User-agent: *
9
10# WordPress admin & authentication
11Disallow: /wp-admin/
12Disallow: /wp-login.php
13Disallow: /wp-register.php
14Disallow: /xmlrpc.php
15Disallow: /wp-comments-post.php
16
17# Allow the admin-ajax endpoint (used by front-end functionality Googlebot may need)
18Allow: /wp-admin/admin-ajax.php
19
20# WordPress REST API (exposes internal data)
21Disallow: /wp-json/
22
23# WordPress form uploads (no indexable content)
24Disallow: /wp-content/uploads/wpforms/
25
26# NOTE: /wp-content/plugins/ and /wp-content/themes/ are intentionally NOT
27# blocked. Googlebot needs the CSS/JS in these folders to render pages
28# correctly. Directory browsing should be disabled at the server level,
29# not via robots.txt.
30
31# WordPress utility feeds
32Disallow: /feed/
33Disallow: /comments/feed/
34Disallow: /*/feed/
35Disallow: /*/trackback/
36
37# Search results pages (duplicate content)
38Disallow: /?s=
39Disallow: /search/
40
41# URL parameter-based pages (duplicate content)
42Disallow: /?p=
43Disallow: /?page_id=
44Disallow: /?cat=
45Disallow: /?tag=
46Disallow: /?attachment_id=
47Disallow: /?replytocom=
48
49# Embed pages
50Disallow: /embed/
51
52# Calendar export (iCal)
53Disallow: /news-and-events/events/?ical=
54
55# WP Engine internal sign-on plugin
56Disallow: /wpe_sign_on_plugin/
57
58# -------------------------------------------------------
59# AI crawlers — full access for GEO visibility, but still
60# block the same admin/internal paths.
61# (A crawler matching a specific user-agent group ignores the "*"
62# group entirely, so only the rules repeated in this group apply to it.)
63# -------------------------------------------------------
64User-agent: GPTBot
65User-agent: ChatGPT-User
66User-agent: OAI-SearchBot
67User-agent: PerplexityBot
68User-agent: ClaudeBot
69User-agent: anthropic-ai
70User-agent: Claude-Web
71User-agent: Google-Extended
72User-agent: cohere-ai
73Allow: /
74Disallow: /wp-admin/
75Disallow: /wp-login.php
76Disallow: /xmlrpc.php
77Disallow: /wp-json/
78Disallow: /wp-content/uploads/wpforms/
79Disallow: /?s=
80Disallow: /wpe_sign_on_plugin/
81
82# -------------------------------------------------------
83# Sitemap
84# -------------------------------------------------------
85Sitemap: https://gf.com/sitemap_index.xml