# robots.txt for http://www.dcs.hull.ac.uk/
#
# See the Robots Exclusion Protocol (RFC 9309) for an explanation of this
# file format.
#
# Layout notes:
#   * One directive per line; a "#" starts a comment that runs to end of line.
#   * Each robot is named on its own "User-agent:" line; consecutive
#     User-agent lines share the rule set that follows them.
#   * Blank lines are used ONLY between groups, because older parsers treat
#     a blank line as the end of a record. Inside a group, bare "#" lines
#     are used as visual separators instead.

# ---------------------------------------------------------------------------
# Known e-mail harvesters and site copiers: keep them out of everything.
# Robots are matched on their product token, so no version suffix is given
# (this also covers any other version of the same robot).
# ---------------------------------------------------------------------------
User-agent: CherryPickerSE
User-agent: CherryPickerElite
User-agent: EmailCollector
User-agent: EmailWolf
User-agent: EmailSiphon
User-agent: WebCopier
# Whole site - for globbers
Disallow: *
# Whole site - for non-globbers (plain prefix match)
Disallow: /

# ---------------------------------------------------------------------------
# Everybody else.
#
# Some robots use regexps and globbing and some do not, so several rules
# below appear twice: once in a form aimed at globbers and once as a plain
# path prefix for non-globbers.
# ---------------------------------------------------------------------------
User-agent: *
# Ignore editor backup files - for globbers
Disallow: *~
# Ignore dotted directories - for globbers
Disallow: /\.
# Ignore dotted directories - for non-globbers
Disallow: /.
Disallow: /etc/
Disallow: /tmp/
Disallow: /incoming/
Disallow: /usr/
Disallow: /lib/
Disallow: /dev/
Disallow: /alex/
Disallow: /bin/
Disallow: /news/
Disallow: /cgi-bin/
Disallow: /WWW/cgi-bin/
Disallow: /lost+found/
#
# The same tree again underneath /public/
#
# Ignore dotted directories - for globbers
Disallow: /public/\.
# Ignore dotted directories - for non-globbers
Disallow: /public/.
Disallow: /public/etc/
Disallow: /public/tmp/
Disallow: /public/incoming/
Disallow: /public/usr/
Disallow: /public/lib/
Disallow: /public/dev/
Disallow: /public/alex/
Disallow: /public/bin/
Disallow: /public/news/
# Stop file name loops!
Disallow: /public/public/
Disallow: /public/WWW/cgi-bin/
Disallow: /public/lost+found/
# In case the crawler globs ("+" escaped)
Disallow: /public/lost\+found/
# Stop atext being silly!
Disallow: /public/wais-sources/internet-servers
#
# All of these rules exist just for atext, which makes speculative grabs
# of .../public/ underneath every directory it finds.
#
Disallow: /public/etc/public/
Disallow: /public/tmp/public/
Disallow: /public/incoming/public/
Disallow: /public/usr/public/
Disallow: /public/lib/public/
Disallow: /public/dev/public/
Disallow: /public/alex/public/
Disallow: /public/bin/public/
Disallow: /public/news/public/
Disallow: /public/WWW/public/
Disallow: /public/WWW/cgi-bin/public/
Disallow: /public/lost+found/public/
Disallow: /public/wais-sources/public/
Disallow: /public/faces/public/
Disallow: /public/Hull/public/
#
# Stop indexing of student user pages and pages of other departments.
# Each prefix is listed twice: the plain form for non-globbers (prefix
# match) and the "*" form for globbers.
#
Disallow: /~ee
Disallow: /~ee*
Disallow: /~dm
Disallow: /~dm*
Disallow: /~ms
Disallow: /~ms*
Disallow: /~csm
Disallow: /~csm*
Disallow: /~cs5
Disallow: /~cs5*
Disallow: /~cs6
Disallow: /~cs6*
Disallow: /~cs7
Disallow: /~cs7*
Disallow: /~cs8
Disallow: /~cs8*
Disallow: /~cs9
Disallow: /~cs9*
Disallow: /~cs0
Disallow: /~cs0*