2001-01-05 11:42:11 +00:00
|
|
|
# /robots.txt for http://www.musi-cal.com/
|
|
|
|
|
# See http://info.webcrawler.com/mak/projects/robots/norobots.html
|
|
|
|
|
# Skip Montanaro (skip@mojam.com)
|
|
|
|
|
# - adapted from the robots.txt file at http://web.nexor.co.uk/
|
|
|
|
|
|
|
|
|
|
# Disallow a bunch of ill-behaved user agents (honouring robots.txt is voluntary, so this probably won't deter them...)
|
2001-02-20 09:32:36 +00:00
|
|
|
|
2001-01-05 11:42:11 +00:00
|
|
|
User-agent: ExtractorPro
|
|
|
|
|
Disallow: /
|
2001-02-20 09:32:36 +00:00
|
|
|
|
2001-01-05 11:42:11 +00:00
|
|
|
User-agent: EmailSiphon
|
|
|
|
|
Disallow: /
|
2001-02-20 09:32:36 +00:00
|
|
|
|
2001-01-05 11:42:11 +00:00
|
|
|
User-agent: EmailWolf
|
|
|
|
|
Disallow: /
|
2001-02-20 09:32:36 +00:00
|
|
|
|
2001-01-05 11:42:11 +00:00
|
|
|
User-agent: CherryPickerSE/1.0
|
|
|
|
|
Disallow: /
|
2001-02-20 09:32:36 +00:00
|
|
|
|
2001-01-05 11:42:11 +00:00
|
|
|
User-agent: CherryPickerElite/1.0
|
|
|
|
|
Disallow: /
|
2001-02-20 09:32:36 +00:00
|
|
|
|
2001-01-05 11:42:11 +00:00
|
|
|
User-agent: EmailCollector/1.0
|
|
|
|
|
Disallow: /
|
2001-02-20 09:32:36 +00:00
|
|
|
|
2001-01-05 11:42:11 +00:00
|
|
|
User-agent: EmailWolf 1.00
|
|
|
|
|
Disallow: /
|
2001-02-20 09:32:36 +00:00
|
|
|
|
2001-01-05 11:42:11 +00:00
|
|
|
User-agent: Crescent Internet ToolPak HTTP OLE Control v.1.0
|
|
|
|
|
Disallow: /
|
2001-02-20 09:32:36 +00:00
|
|
|
|
2001-01-05 11:42:11 +00:00
|
|
|
User-agent: EmailSiphon
|
|
|
|
|
Disallow: /
|
2001-02-20 09:32:36 +00:00
|
|
|
|
2001-01-05 11:42:11 +00:00
|
|
|
User-agent: Mozilla/2.0 (compatible; NEWT ActiveX; Win32)
|
2001-02-20 09:32:36 +00:00
|
|
|
Disallow: /
|
|
|
|
|
|
|
|
|
|
# Default rules for all robots not named above
|
|
|
|
|
|
|
|
|
|
User-agent: *
|
|
|
|
|
Disallow: /ccrd # not useful to spiders
|
|
|
|
|
Disallow: /click # not useful to spiders
|
|
|
|
|
Disallow: /search # dynamic
|
|
|
|
|
Disallow: /hc # dynamic
|
|
|
|
|
Disallow: /subbatch # dynamic
|
|
|
|
|
Disallow: /vadd # dynamic
|
|
|
|
|
Disallow: /vsearch # dynamic
|
|
|
|
|
Disallow: /vedit # dynamic
|
|
|
|
|
Disallow: /vdelete # dynamic
|
|
|
|
|
Disallow: /cgi-bin # dynamic
|
|
|
|
|
Disallow: /images/ # useless images
|
|
|
|
|
Disallow: /icons/ # useless images
|
|
|
|
|
Disallow: /concerts/ # deprecated URL form
|
|
|
|
|
Disallow: /conferences # defunct
|
|
|
|
|
Disallow: /musician # defunct
|
|
|
|
|
Disallow: /~skip/volkswagen # defunct
|
|
|
|
|
Disallow: /%7Eskip/volkswagen # defunct
|
|
|
|
|
|