# D:\dh\web\NSC\3\HTM\robots.txt (49 lines) 2007-06-13 05:39 Dean Hannotte
#----------------------------------------------------------------------#
# NOTE: Lines in this file must end in LF's, not CRLF's.
#       In KEDIT, issue 'eolout lf'.
#----------------------------------------------------------------------#
#
# Extracts from 'http://www.robotstxt.org/wc/norobots.html'
#
# User-agent
#     The value of this field is the name of the robot the record is
#     describing access policy for.
#
#     If more than one User-agent field is present the record
#     describes an identical access policy for more than one robot. At
#     least one field needs to be present per record.
#
#     The robot should be liberal in interpreting this field. A case
#     insensitive substring match of the name without version information
#     is recommended.
#
#     If the value is '*', the record describes the default access
#     policy for any robot that has not matched any of the other records.
#     It is not allowed to have multiple such records in the "/robots.txt"
#     file.
#
# Disallow
#     The value of this field specifies a partial URL that is not to
#     be visited. This can be a full path, or a partial path; any URL that
#     starts with this value will not be retrieved. For example, Disallow:
#     /help disallows both /help.html and /help/index.html, whereas
#     Disallow: /help/ would disallow /help/index.html but allow
#     /help.html.
#
#     Any empty value, indicates that all URLs can be retrieved. At
#     least one Disallow field needs to be present in a record.
#
#----------------------------------------------------------------------#

User-agent: *
Disallow: /cgi-bin/   # anything in the /cgi-bin directory
Disallow: /_          # every path that starts with an underscore
Disallow: /0_readme   # msg from geocities
Disallow: /_jenfavs   # redundant: already matched by "/_" above; kept for clarity
Disallow: /Chat-1     # redundant: already matched by "/Chat" below; kept for clarity
Disallow: /Chat       # both chat.htm and chats.htm; TODO confirm case (matching is case-sensitive)
Disallow: /Dean1975
Disallow: /RosenBKP
Disallow: /RosenCat
Disallow: /ws_ftp