McGill University / robots.txt snapshot
← back to mcgill.ca · fetched 2026-06-26T16:59:04Z (1h ago) · HTTP 200 · 3386 bytes · sha256 34318cefd2355fc2 · raw
final URL: https://www.mcgill.ca/robots.txt
| 1 | # |
| 2 | # robots.txt |
| 3 | # |
| 4 | # This file is to prevent the crawling and indexing of certain parts |
| 5 | # of your site by web crawlers and spiders run by sites like Yahoo! |
| 6 | # and Google. By telling these "robots" where not to go on your site, |
| 7 | # you save bandwidth and server resources. |
| 8 | # |
| 9 | # This file will be ignored unless it is at the root of your host: |
| 10 | # Used: http://example.com/robots.txt |
| 11 | # Ignored: http://example.com/site/robots.txt |
| 12 | # |
| 13 | # For more information about the robots.txt standard, see: |
| 14 | # http://www.robotstxt.org/robotstxt.html |
| 15 | |
| 16 | Sitemap: https://www.mcgill.ca/root/sitemap-index.xml |
| 17 | Sitemap: https://www.mcgill.ca/sitemap.xml |
| 18 | |
| 19 | User-agent: Lucidworks-Anda/2.0 |
| 20 | Crawl-delay: 0 |
| 21 | |
| 22 | User-agent: Elastic-Crawler |
| 23 | Crawl-delay: 0 |
| 24 | |
| 25 | User-agent: * |
| 26 | Crawl-delay: 5 |
| 27 | |
| 28 | User-agent: archive.org_bot |
| 29 | Allow: /study/* |
| 30 | |
| 31 | # CSS, JS, Images |
| 32 | Allow: */misc/*.css$ |
| 33 | Allow: */misc/*.css? |
| 34 | Allow: */misc/*.js$ |
| 35 | Allow: */misc/*.js? |
| 36 | Allow: */misc/*.gif |
| 37 | Allow: */misc/*.jpg |
| 38 | Allow: */misc/*.jpeg |
| 39 | Allow: */misc/*.png |
| 40 | Allow: */modules/*.css$ |
| 41 | Allow: */modules/*.css? |
| 42 | Allow: */modules/*.js$ |
| 43 | Allow: */modules/*.js? |
| 44 | Allow: */modules/*.gif |
| 45 | Allow: */modules/*.jpg |
| 46 | Allow: */modules/*.jpeg |
| 47 | Allow: */modules/*.png |
| 48 | Allow: */profiles/*.css$ |
| 49 | Allow: */profiles/*.css? |
| 50 | Allow: */profiles/*.js$ |
| 51 | Allow: */profiles/*.js? |
| 52 | Allow: */profiles/*.gif |
| 53 | Allow: */profiles/*.jpg |
| 54 | Allow: */profiles/*.jpeg |
| 55 | Allow: */profiles/*.png |
| 56 | Allow: */themes/*.css$ |
| 57 | Allow: */themes/*.css? |
| 58 | Allow: */themes/*.js$ |
| 59 | Allow: */themes/*.js? |
| 60 | Allow: */themes/*.gif |
| 61 | Allow: */themes/*.jpg |
| 62 | Allow: */themes/*.jpeg |
| 63 | Allow: */themes/*.png |
| 64 | # Directories |
| 65 | Disallow: */includes/ |
| 66 | Disallow: */modules/ |
| 67 | Disallow: */profiles/ |
| 68 | Disallow: */scripts/ |
| 69 | Disallow: */themes/ |
| 70 | # eCals |
| 71 | Disallow: /study/* |
| 72 | # Files |
| 73 | Disallow: */CHANGELOG.txt |
| 74 | Disallow: */cron.php |
| 75 | Disallow: */INSTALL.mysql.txt |
| 76 | Disallow: */INSTALL.pgsql.txt |
| 77 | Disallow: */INSTALL.sqlite.txt |
| 78 | Disallow: */install.php |
| 79 | Disallow: */INSTALL.txt |
| 80 | Disallow: */LICENSE.txt |
| 81 | Disallow: */MAINTAINERS.txt |
| 82 | Disallow: */update.php |
| 83 | Disallow: */UPGRADE.txt |
| 84 | Disallow: */xmlrpc.php |
| 85 | Disallow: */misc/favicon.ico |
| 86 | # Paths (clean URLs) |
| 87 | Disallow: */admin/ |
| 88 | Disallow: */comment/reply/ |
| 89 | Disallow: */filter/tips/ |
| 90 | Disallow: */node/add/ |
| 91 | Disallow: */search/ |
| 92 | Disallow: /*/people/* |
| 93 | Disallow: /*/events/* |
| 94 | Disallow: /undergraduate-admissions/programs?* |
| 95 | Disallow: /gradapplicants/programs?* |
| 96 | Disallow: */user/register/ |
| 97 | Disallow: */user/password/ |
| 98 | Disallow: */user/login/ |
| 99 | Disallow: */user/logout/ |
| 100 | Disallow: */user |
| 101 | # Paths (no clean URLs) |
| 102 | Disallow: */?q=admin/ |
| 103 | Disallow: */?q=comment/reply/ |
| 104 | Disallow: */?q=filter/tips/ |
| 105 | Disallow: */?q=node/add/ |
| 106 | Disallow: */?q=search/ |
| 107 | Disallow: /?q=study/*/courses/search |
| 108 | Disallow: /?q=study/*/programs/search |
| 109 | Disallow: /?q=study/*/search/all |
| 110 | Disallow: */?q=user/password/ |
| 111 | Disallow: */?q=user/register/ |
| 112 | Disallow: */?q=user/login/ |
| 113 | Disallow: */?q=user/logout/ |
| 114 | Disallow: /*.zip$ |
| 115 | Disallow: /*.gif$ |
| 116 | Disallow: /*.jpg$ |
| 117 | Disallow: /*.jpeg$ |
| 118 | Disallow: /*.png$ |
| 119 | Disallow: /*.tif$ |
| 120 | Disallow: /*.tiff$ |
| 121 | Disallow: /*.dll$ |
| 122 | Disallow: /*.exe$ |
| 123 | Disallow: /*.class$ |
| 124 | Disallow: /*.wmv$ |
| 125 | Disallow: /*.m4v$ |
| 126 | Disallow: /*.jar$ |
| 127 | Disallow: /*.gz$ |
| 128 | Disallow: /*.tar$ |
| 129 | Disallow: /*.css$ |
| 130 | Disallow: /*.inc$ |
| 131 | Disallow: /*.js$ |
| 132 | Disallow: /*.js.php$ |
| 133 | Disallow: /*.swf$ |
| 134 | Disallow: /*.fla$ |
| 135 | Disallow: /*.psd$ |
| 136 | Disallow: /*.m4a$ |
| 137 | Disallow: /*.m4p$ |
| 138 | Disallow: /*.aac$ |
| 139 | Disallow: /*.m2a$ |
| 140 | Disallow: /*.m2v$ |
| 141 | Disallow: /*.sit$ |
| 142 | Disallow: /*.dmg$ |
| 143 | Disallow: /*.wma$ |
| 144 | Disallow: /*.mdb$ |
| 145 | Disallow: /*.tar.gz2$ |
| 146 | Disallow: /*.rar$ |