#*******************************************************************************
#
# Control access by search engines, crawlers, spiders, or robots.
#
# This file must be named robots.txt in the root directory of the web site.
#
# Format: one directive per line. Anything after a '#' is a comment, so a
# directive that shares a line with a preceding '#' is ignored. Records
# (a User-agent line followed by its Disallow lines) are separated by a
# blank line.
#
#-------------------------------------------------------------------------------
#
# Note: See RFC 1808 and draft-koster-robots-00.txt.
#
#*******************************************************************************
# Last modified: 11.16.07 oa
#*******************************************************************************

# Robots that are denied access to the entire site.
User-agent: sitecheck.internetseer.com
Disallow: /

User-agent: LinkWalker
Disallow: /

# Default record: applies to every robot not matched by a record above.
User-agent: *                    # Affects all robots
Disallow: /ar/
Disallow: /bp/projections/
Disallow: /cgi                   # Executable CGI programs
Disallow: /cgi-bin/              # Private working directory
Disallow: /Expression/           # Private working directory
Disallow: /fmdc/js               # Executable Javascript programs
Disallow: /images
Disallow: /itsd-old/             # Old working directory
Disallow: /js                    # Executable Javascript programs
Disallow: /jpg
Disallow: /logs                  # Log files
Disallow: /mail/
Disallow: /new/
Disallow: /newsimg/
Disallow: /portal/
Disallow: /pl                    # Executable Perl programs
Disallow: /shultz/               # Private working directory
Disallow: /ssi
Disallow: /uid                   # Private working directory
Disallow: /oeo/                  # Old directory, but some files are still used by programs
Disallow: /oaginc/
Disallow: /xml/
Disallow: /mo/functions/
Disallow: /mo/cities/
Disallow: /mo/agencies/
Disallow: /mo/cgi-bin/