NeuralCrawl

Warner Music Group / robots.txt snapshot

← back to wmg.com · fetched 2026-06-20T01:10:31Z (15h ago) · HTTP 200 · 2783 bytes · sha256 dd38573bbab90acd · raw

final URL: https://wmg.com/robots.txt

1#
2# robots.txt
3#
4# This file is to prevent the crawling and indexing of certain parts
5# of your site by web crawlers and spiders run by sites like Yahoo!
6# and Google. By telling these "robots" where not to go on your site,
7# you save bandwidth and server resources.
8#
9# This file will be ignored unless it is at the root of your host:
10# Used: http://example.com/robots.txt
11# Ignored: http://example.com/site/robots.txt
12#
13# For more information about the robots.txt standard, see:
14# http://www.robotstxt.org/robotstxt.html
15
16User-agent: *
17Crawl-delay: 10
18# CSS, JS, Images
19Allow: /misc/*.css$
20Allow: /misc/*.css?
21Allow: /misc/*.js$
22Allow: /misc/*.js?
23Allow: /misc/*.gif
24Allow: /misc/*.jpg
25Allow: /misc/*.jpeg
26Allow: /misc/*.png
27Allow: /modules/*.css$
28Allow: /modules/*.css?
29Allow: /modules/*.js$
30Allow: /modules/*.js?
31Allow: /modules/*.gif
32Allow: /modules/*.jpg
33Allow: /modules/*.jpeg
34Allow: /modules/*.png
35Allow: /profiles/*.css$
36Allow: /profiles/*.css?
37Allow: /profiles/*.js$
38Allow: /profiles/*.js?
39Allow: /profiles/*.gif
40Allow: /profiles/*.jpg
41Allow: /profiles/*.jpeg
42Allow: /profiles/*.png
43Allow: /themes/*.css$
44Allow: /themes/*.css?
45Allow: /themes/*.js$
46Allow: /themes/*.js?
47Allow: /themes/*.gif
48Allow: /themes/*.jpg
49Allow: /themes/*.jpeg
50Allow: /themes/*.png
51# Directories
52Disallow: /includes/
53Disallow: /misc/
54Disallow: /modules/
55Disallow: /profiles/
56Disallow: /scripts/
57Disallow: /themes/
58# Files
59Disallow: /CHANGELOG.txt
60Disallow: /cron.php
61Disallow: /INSTALL.mysql.txt
62Disallow: /INSTALL.pgsql.txt
63Disallow: /INSTALL.sqlite.txt
64Disallow: /install.php
65Disallow: /INSTALL.txt
66Disallow: /LICENSE.txt
67Disallow: /MAINTAINERS.txt
68Disallow: /update.php
69Disallow: /UPGRADE.txt
70Disallow: /xmlrpc.php
71# Paths (clean URLs)
72Disallow: /admin/
73Disallow: /comment/reply/
74Disallow: /filter/tips/
75Disallow: /node/add/
76Disallow: /search/
77Disallow: /user/register/
78Disallow: /user/password/
79Disallow: /user/login/
80Disallow: /user/logout/
81Disallow: /member/
82# Paths (no clean URLs)
83Disallow: /?q=admin/
84Disallow: /?q=comment/reply/
85Disallow: /?q=filter/tips/
86Disallow: /?q=node/add/
87Disallow: /?q=search/
88Disallow: /?q=user/password/
89Disallow: /?q=user/register/
90Disallow: /?q=user/login/
91Disallow: /?q=user/logout/
92Disallow: /?frontpage=true
93Disallow: /?ref=[\w&='" _. ]+/
94
95# wordpress
96
97Disallow: /cgi-bin
98Disallow: /wp-admin
99Disallow: /wp-includes
100Disallow: /wp-content/plugins
101Disallow: /wp-content/cache
102Disallow: /wp-content/themes
103Disallow: /trackback
104Disallow: /feed
105Disallow: /comments
106Disallow: /category/*/*
107Disallow: */trackback
108Disallow: */feed
109Disallow: */comments
110Disallow: /*?*
111Disallow: /*?
112Allow: /wp-content/uploads
113
114# Google Image
115User-agent: Googlebot-Image
116Allow: /*
117Disallow: /cgi-bin
118Disallow: /wp-admin
119Disallow: /wp-includes
120Disallow: /trackback
121Disallow: /comments