# robots.txt for http://www.alegria.com/
#
# Layout notes:
#   * One directive per line. A "#" starts a comment that runs to the end of
#     the line, so directives must never share a line with a leading comment.
#   * No blank lines inside the group below: parsers following the original
#     1994 convention treat a blank line as the end of a record. Use a bare
#     "#" line as a visual separator instead.
#   * Comments sit on their own lines rather than after a directive, since
#     not every parser strips trailing comments.

User-agent: *
#
# Mail archives: why not let them in? (rules left disabled on purpose)
#   hypermail's huge database:
#Disallow: /telecine/hypermail/
#   mhonarc's archive:
#Disallow: /telecine/mhonarc/
#
# Keep the pipermail/mailman *.txt.gz archives from being indexed; see
# http://www.nextthing.org/archives/2007/03/12/robotstxt-adventure
# NOTE: "*" and "$" are pattern extensions; crawlers that implement only
# plain prefix matching will not interpret this rule as a wildcard.
Disallow: /*.txt.gz$
#
Disallow: /Excite
Disallow: /php3/
Disallow: /usage.colorist/
Disallow: /usage.tig.colorist/
Disallow: /stats-2000/
Disallow: /stats-1999/
Disallow: /stats-1998/
Disallow: /stats-1997/
Disallow: /stats-1996/
Disallow: /stats-1995/
Disallow: /stats-1994/
# old
Disallow: /mindterm_3.1.2/
Disallow: /cgi-bin/
# This is the weird prepended dir to those multiple strange pathnames.
Disallow: /telecinehome.phtml/
Disallow: /accesswatch-1.33/
Disallow: /96/
Disallow: /95/
Disallow: /94/
#
# To shield legitimate webcrawlers?
# (Already covered by "Disallow: /cgi-bin/" above under prefix matching;
# kept as an explicit entry.)
Disallow: /cgi-bin/mailinglists
#
# Per http://www.mediawiki.org/wiki/Manual:Short_URL
Disallow: /wiki3/
Disallow: /wiki/Special:Search
Disallow: /wiki/Special:Random
#
# Until the webpages are ready.
# (/test/dira/, /test/dirb/ and /tig3/HTML_Templates/actualtexts/ are already
# covered by their parent-directory rules; kept as explicit entries.)
Disallow: /twiki/
Disallow: /test/
Disallow: /test/dira/
Disallow: /test/dirb/
Disallow: /test.phtml
Disallow: /test3.phtml
Disallow: /test2.phtml
Disallow: /robhome.phtml
Disallow: /backup/
Disallow: /telecine/temp/
Disallow: /tig3/HTML_Templates/
Disallow: /tig3/HTML_Templates/actualtexts/
#
# Monthly web-stats pages. There should be a better way -- a directory,
# eventually.
Disallow: /Jan.wwwstats.html
Disallow: /Feb.wwwstats.html
Disallow: /Mar.wwwstats.html
Disallow: /Apr.wwwstats.html
Disallow: /May.wwwstats.html
Disallow: /Jun.wwwstats.html
Disallow: /Jul.wwwstats.html
Disallow: /Aug.wwwstats.html
Disallow: /Sep.wwwstats.html
Disallow: /Oct.wwwstats.html
Disallow: /Nov.wwwstats.html
Disallow: /Dec.wwwstats.html
Disallow: /wwwstats.html
Disallow: /wwwerrs.html
Disallow: /error.html
Disallow: /jenny/
Disallow: /media/