NeuralCrawl

bioRxiv / robots.txt snapshot

← back to biorxiv.org · fetched 2026-06-26T14:15:22Z (4h ago) · HTTP 200 · 3637 bytes · sha256 1cc8ace946ec6935 · raw

final URL: https://www.biorxiv.org/robots.txt

1#
2# robots.txt
3#
4# This file is to prevent the crawling and indexing of certain parts
5# of your site by web crawlers and spiders run by sites like Yahoo!
6# and Google. By telling these "robots" where not to go on your site,
7# you save bandwidth and server resources.
8#
9# This file will be ignored unless it is at the root of your host:
10# Used: http://example.com/robots.txt
11# Ignored: http://example.com/site/robots.txt
12#
13# For more information about the robots.txt standard, see:
14# http://www.robotstxt.org/robotstxt.html
15
16User-agent: BLEXBot
17Disallow: /
18User-agent: Bytespider
19Disallow: /
20User-agent: Exabot
21Disallow: /
22User-agent: Scanbot
23Disallow: /
24User-agent: Semrush
25Disallow: /
26User-agent: SemrushBot
27Disallow: /
28User-agent: YoudaoBot
29Disallow: /
30User-agent: Baiduspider
31Disallow: /
32User-agent: YandexBot
33Disallow: /
34User-agent: openai
35Disallow: /
36User-agent: Petalbot
37Disallow: /
38User-agent: Bolt
39Disallow: /
40User-agent: BunnySlippers
41Disallow: /
42User-agent: ChatGPT-User
43Disallow: /
44User-agent: GPTBot
45Disallow: /
46User-agent: Gigabot
47Disallow: /
48User-agent: HybridBot
49Disallow: /
50User-agent: JikeSpider
51Disallow: /
52User-agent: SMTBot
53Disallow: /
54User-agent: ScreenerBot
55Disallow: /
56User-agent: SiteLockSpider
57Disallow: /
58User-agent: SuperBot
59Disallow: /
60User-agent: SuperHTTP
61Disallow: /
62User-agent: Amazonbot
63Disallow: /
64User-agent: AhrefsBot
65Disallow: /
66User-agent: Applebot
67Disallow: /
68User-agent: SEMrush
69Disallow: /
70User-agent: DataForSeoBot
71Disallow: /
72User-agent: ClaudeBot
73Disallow: /
74User-agent: DotBot
75Disallow: /
76User-agent: phxbot
77Disallow: /
78User-agent: AwarioBot
79Disallow: /
80User-agent: SeekportBot
81Disallow: /
82User-agent: MJ12bot
83Disallow: /
84User-agent: Majestic12
85Disallow: /
86User-agent: facebookexternalhit/1.1
87Disallow: /
88User-agent: PerplexityBot
89Disallow: /
90User-agent: Qwantbot
91Disallow: /
92User-agent: CCBot
93Disallow: /
94User-agent: python-requests/2.32.3
95Disallow: /
96User-agent: wget
97Disallow: /
98User-agent: curl
99Disallow: /
100
101User-agent: *
102Crawl-delay: 7
103# CSS, JS, Images
104Allow: /misc/*.css$
105Allow: /misc/*.css?
106Allow: /misc/*.js$
107Allow: /misc/*.js?
108Allow: /misc/*.gif
109Allow: /misc/*.jpg
110Allow: /misc/*.jpeg
111Allow: /misc/*.png
112Allow: /modules/*.css$
113Allow: /modules/*.css?
114Allow: /modules/*.js$
115Allow: /modules/*.js?
116Allow: /modules/*.gif
117Allow: /modules/*.jpg
118Allow: /modules/*.jpeg
119Allow: /modules/*.png
120Allow: /profiles/*.css$
121Allow: /profiles/*.css?
122Allow: /profiles/*.js$
123Allow: /profiles/*.js?
124Allow: /profiles/*.gif
125Allow: /profiles/*.jpg
126Allow: /profiles/*.jpeg
127Allow: /profiles/*.png
128Allow: /themes/*.css$
129Allow: /themes/*.css?
130Allow: /themes/*.js$
131Allow: /themes/*.js?
132Allow: /themes/*.gif
133Allow: /themes/*.jpg
134Allow: /themes/*.jpeg
135Allow: /themes/*.png
136# Directories
137Disallow: /includes/
138Disallow: /misc/
139Disallow: /modules/
140Disallow: /profiles/
141Disallow: /scripts/
142Disallow: /themes/
143# Files
144Disallow: /CHANGELOG.txt
145Disallow: /cron.php
146Disallow: /INSTALL.mysql.txt
147Disallow: /INSTALL.pgsql.txt
148Disallow: /INSTALL.sqlite.txt
149Disallow: /install.php
150Disallow: /INSTALL.txt
151Disallow: /LICENSE.txt
152Disallow: /MAINTAINERS.txt
153Disallow: /update.php
154Disallow: /UPGRADE.txt
155Disallow: /xmlrpc.php
156# Paths (clean URLs)
157Disallow: /admin/
158Disallow: /comment/reply/
159Disallow: /filter/tips/
160Disallow: /node/add/
161Disallow: /search/
162Disallow: /user/register/
163Disallow: /user/password/
164Disallow: /user/login/
165Disallow: /user/logout/
166# Paths (no clean URLs)
167Disallow: /?q=admin/
168Disallow: /?q=comment/reply/
169Disallow: /?q=filter/tips/
170Disallow: /?q=node/add/
171Disallow: /?q=search/
172Disallow: /?q=user/password/
173Disallow: /?q=user/register/
174Disallow: /?q=user/login/
175Disallow: /?q=user/logout/
176Disallow: /user