# Robots exclusion file for this site.
#
# Policy summary:
#   * Every robot is kept out of the paths listed in the "User-agent: *"
#     group at the bottom of this file.
#   * The robots named individually below are excluded from the whole site,
#     except archive.org_bot, which is allowed to crawl everything.
#
# A robot obeys only the group that names it most specifically, so a robot
# listed by name does NOT additionally inherit the "User-agent: *" rules.
# All rules for "*" are kept in ONE group on purpose: some parsers honour
# only the first matching group and silently ignore later duplicates.
#
# Each directive must be on its own line; a "#" starts a comment that runs
# to the end of the line.
#
# For further details see https://www.robotstxt.org/robotstxt.html
# and RFC 9309 (Robots Exclusion Protocol).

# --- Robots excluded from the entire site ---------------------------------
# NOTE(review): some tokens below carry a version or extra words
# (e.g. "LiteFinder/1.0", "Nutch Spider/Nutch-1.0-dev"). Parsers that match
# on the bare product token may not match these lines -- confirm against
# each crawler's documented token before relying on them.

User-agent: MSR-ISRCCrawler
Disallow: /

User-agent: Nutch Spider/Nutch-1.0-dev
Disallow: /

User-agent: LTI/LemurProject
Disallow: /

User-agent: LiteFinder/1.0
Disallow: /

User-agent: NextGenSearchBot
Disallow: /

# --- Robots allowed everywhere --------------------------------------------
# An empty Disallow value means "nothing is disallowed".

User-agent: archive.org_bot
Disallow:

# --- Disabled legacy per-robot entries (kept for reference) ---------------

#User-agent: Googlebot/2.1                       # best search site
#Disallow: /phpdoc/

#User-agent: webcollage/1.54                     # interesting site
#Disallow: /phpdoc/

#User-agent: ru-robot/1.0                        # rutgers univ ?
#Disallow: /phpdoc/

#User-agent: Netscape-Catalog-Robot/1.01         # The Netscape Catalog
#Disallow: /phpdoc/

#User-agent: ArchitextSpider                     # the eXcite robot
#Disallow: /phpdoc/

#User-agent: InfoSeek Sidewinder                 # the InfoSeek robot
#Disallow: /phpdoc/

#User-agent: InfoSeek Robot 1.0                  # the InfoSeek robot
#Disallow: /phpdoc/

#User-agent: Scooter/1.0                         # The AltaVista robot
#Disallow: /phpdoc/

#User-agent: Scooter_Mercator_1-1.0              # The AltaVista robot ??
#Disallow: /phpdoc/

#User-agent: Lycos                               # The Lycos robot
#Disallow: /phpdoc/

#User-agent: Muscat/Ferret                       # The Euroferret
#Disallow: /phpdoc/

#User-agent: Slurp                               # The HotBot from inktomi
#Disallow: /phpdoc/

#User-agent: Webcrawler/3.0 Robot libwww/5.0a    # The WebCrawler
#Disallow: /phpdoc/

# --- Rules for every robot not named above --------------------------------

User-agent: *
Disallow: /financial/
Disallow: /MMO/
Disallow: /business/positions/
# Try to block the ncpmounted stuff and the webfiles
Disallow: /OGS1/
Disallow: /OGS_BS1/
Disallow: /phpdoc/
Disallow: /webfiles/

# Disabled: tell all other robots to go away
# User-agent: *
# Disallow: /