# robots.txt for http://blog.jesusdomain.org/
# $Id: robots.txt,v 1.9 2002/9/27 13:13:08 GrandWebTraffic $
#
# This file is retrieved by search-engine robots (a.k.a. web crawlers,
# spiders) that conform to the de facto Robots Exclusion standard.
# See https://www.robotstxt.org/robotstxt.html
# See https://www.rfc-editor.org/rfc/rfc9309
#
# The HostMaster for this site is: (contact address missing - TODO restore)
#
# Format is:
#   User-agent: <name of spider>
#   Disallow: <nothing> | <path>
#
# IMPORTANT: robots.txt is line-oriented. Every directive must sit on its own
# line; if the file is collapsed onto one line that begins with '#', parsers
# treat the whole file as a comment and none of the rules below apply.
#
# Flag Date     By          Reason
# $L1= 19970130 GrandAccess First Version
# $L2= 19980909 GrandAccess fixed url since make move to Domain Name
# $L3= 10990811 GrandAccess Updated Engines
# $L5= 20040427 GrandAccess Updated disallow rules
# $L5= 20070729 GrandAccess Updated for New sites
# NOTE(review): the $L3 date (10990811) looks like a typo, presumably
# 19990811, and the first $L5 flag is presumably $L4 - confirm against
# revision history before correcting.
# -----------------------------------------------------------------------------

# Default group: applies to every robot not matched by a named group below.
User-agent: *
Disallow: /cgi-bin/
Disallow: /images/

# NOTE(review): each named group below repeats the default rules exactly, so
# they are redundant with the '*' group; kept as-is to preserve the original
# rule set.

User-agent: GoogleBot
Disallow: /cgi-bin/
Disallow: /images/

User-agent: cybermapper
Disallow: /cgi-bin/
Disallow: /images/

User-agent: W3Crobot/1
Disallow: /cgi-bin/
Disallow: /images/

User-agent: AltaVista Intranet V2.0 W3C Webreq
Disallow: /cgi-bin/
Disallow: /images/

User-agent: Mozilla/3.01 (hotwired-test/0.1)
Disallow: /cgi-bin/
Disallow: /images/

User-agent: Slurp
Disallow: /cgi-bin/
Disallow: /images/

User-agent: Scooter
Disallow: /cgi-bin/
Disallow: /images/

User-agent: Ultraseek
Disallow: /cgi-bin/
Disallow: /images/

User-agent: smallbear
Disallow: /cgi-bin/
Disallow: /images/

User-agent: Fast corporate crawler
Disallow: /cgi-bin/
Disallow: /images/