#
#
# This file lists local URLs that well-behaved robots should ignore
User-agent: *
Disallow: /cgi-bin/ # includes some large virtual spaces
Disallow: /analog/ # skip usage reports
Disallow: /mirrors # skip local mirrors
Disallow: /adm/ # local web server admin stuff
Disallow: /dcs # moved to /its
Disallow: /its/about # moved to /ict
Disallow: /its/accounts # moved to /ict
Disallow: /its/guides # moved to /ict
Disallow: /its/hardware # moved to /ict
Disallow: /its/services # moved to /ict
Disallow: /calendar/archive/ # old U of S calendars
Disallow: /calendar/coursecat/ # old U of S catalogue
Disallow: /index.php/ # confused robots
Disallow: /sas/secc/cards # only available on campus
Disallow: /redirect.php # google keeps asking for this
Disallow: /registrar/cdrom # not ready for prime time
Disallow: /registrar/01_02_Calendar/
Disallow: /registrar/00_01_Calendar/
Disallow: /registrar/99_00_Calendar/
Disallow: /registrar/98_99_Calendar/
Disallow: /registrar/97_98_Calendar/
Disallow: /registrar/95_96_Calendar/
Disallow: /registrar/archives # old stuff
Disallow: /art/digital_culture/ # old stuff
Disallow: /education/coursework/ # old stuff
Disallow: /archives/eadtest/ # by request
Disallow: /archives/ccad/ # by request
Disallow: /archives/sca/ccagrants/ # by request
Disallow: /antharch/cnea/CourseNotes/erosslides.html # sensitive content
Disallow: /test/
Disallow: /fsd/ # by request ISD-93885
Disallow: /fsd/frames/ # by request (already covered by the /fsd/ rule above)
Disallow: /ulc/lc/lc/ # recursive link
Disallow: /medicine/agmedicine/ # old stuff
Disallow: /includes/ # we'd rather not have this in search results
Disallow: /includes_cascade/ # we'd rather not have this in search results
Disallow: /manual/ # lots of broken links (problem with languages)
Disallow: /calendar/code/ # we'd rather not have this in search results
Disallow: /sesd/sesdconnects/ # by request of Craig McNaughton
Disallow: /taitprojects/content/paws-and-webmail # confusing
Disallow: /learningcommons/booking/mrbs/ # reduce load
Disallow: /search/ # so search results don't appear in search results
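# search engines only need one calendar view, so hide the rest
# NOTE(review): "Disallow: /events/" below is a prefix rule that blocks every
# path under /events/, including the three views listed before it, so no
# calendar view remains crawlable. Confirm which behaviour is intended.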
Disallow: /events/day.php
Disallow: /events/week.php
Disallow: /events/print.php
Disallow: /events/
#
# mailing list archives (deprecated)
#
Disallow: /lists/
#
# Sandboxes and code bases - WCS-1562
#
Disallow: /_uofs-codebase/
Disallow: /_uofs-site-basic/
Disallow: /_usask/
Disallow: /arts-sandbox/
Disallow: /wcs-sandbox/
Disallow: /wcms-sandbox/
Disallow: /usaskcdn-sandbox/
#