# -----------------------------------------------------------------------
# ROBOTS.TXT
#
# This file determines which folders/files search engine robots may or
# may not spider.
# Place this file in the ROOT web directory
# (i.e., www.acnielsenhci.com/robots.txt).
#
# Format notes:
#   - Each directive must be on its own line.
#   - A "User-agent" line starts a group; the "Disallow" lines that follow
#     apply to that robot.
#   - Disallow values are URL path prefixes and must begin with "/".
# -----------------------------------------------------------------------
#
# EXAMPLES:
#
# The following allows all robots to visit all files, because the
# wildcard "*" matches every robot and the empty Disallow blocks nothing.
#
#   User-agent: *
#   Disallow:
#
# This one keeps all robots out.
#
#   User-agent: *
#   Disallow: /
#
# The next one bars all robots from the cgi-bin and images directories:
#
#   User-agent: *
#   Disallow: /cgi-bin/
#   Disallow: /images/
#
# This one bans Roverdog from all files on the server:
#
#   User-agent: Roverdog
#   Disallow: /
#
# This one keeps googlebot from getting at the cheese.htm file:
#
#   User-agent: googlebot
#   Disallow: /cheese.htm
#
# For more complex examples, try retrieving some of the robots.txt files
# from the big sites like CNN or Looksmart.
#
# -----------------------------------------------------------------------

# Rules in effect: for every robot, block crawling of the path prefixes
# listed below. Anything not listed remains crawlable.
User-agent: *
Disallow: /access/
Disallow: /docs/
Disallow: /images/
Disallow: /include/
Disallow: /js/
Disallow: /logs/
Disallow: /survey/
Disallow: /temp/
Disallow: /runserv/
Disallow: /auth/
Disallow: /scn/