#*******************************************************************************
#
# Control access by search engines, crawlers, spiders, or robots.
#
# This file must be named robots.txt in the root directory of the web site.
#
#-------------------------------------------------------------------------------
#
# Note: See RFC 1808 and draft-koster-robots-00.txt.
#       The current standard is RFC 9309 (Robots Exclusion Protocol).
#
# Format: one directive per line. Each group starts with one or more
# "User-agent:" lines followed by its "Disallow:" rules; groups are separated
# by a blank line. A "Disallow:" value is a case-sensitive path PREFIX.
#
#*******************************************************************************
# Last modified: 07.18.05 mo
#*******************************************************************************

# Robots that are banned from the entire site.
User-agent: sitecheck.internetseer.com
Disallow: /

User-agent: LinkWalker
Disallow: /

# Rules below affect all other robots.
User-agent: *
Disallow: /_            # FrontPage and Dreamweaver control files/dirs
Disallow: /Library/     # Dreamweaver library
Disallow: /Templates/   # Dreamweaver templates
Disallow: /tmp/         # Private working directory
Disallow: /private/     # Private working directory
Disallow: /test/        # Private working directory
Disallow: /incoming/    # Private working directory
Disallow: /images/      # Images
Disallow: /logs/        # Log files
Disallow: /Orgs/        # External database using PHP
Disallow: /archive/     # Backup of previous web site
Disallow: /new/         # Private working directory
Disallow: /ar/          # Statistics directory
Disallow: /cgi/         # Executable script directory
Disallow: /cgi-bin/     # Executable script directory
# The "/cgi" prefix below also matches the "/cgi/" and "/cgi-bin/" rules above;
# those two are kept for readability.
Disallow: /cgi          # Executable CGI programs
Disallow: /JS/          # Executable Javascript programs
# NOTE(review): "/pl" is a prefix match, so it blocks every path that starts
# with "/pl", not only Perl scripts -- confirm this is intended.
Disallow: /pl           # Executable PERL programs
# NOTE(review): Disallow stops crawling; it is not a cache-control directive.
Disallow: /CJ38         # Don't Cache SORegistry Data