# robots.txt -- crawler exclusion rules for this site.
#
# One directive per line: a "#" comment runs to the end of the line, so
# directives must never share a line with a preceding comment.
# No blank lines are used inside a group, because some older parsers treat
# a blank line as the end of the record.

# Rules for all robots.
User-agent: *
# exclude help system from robots
Disallow: /manual/
Disallow: /manual-1.3/
Disallow: /manual-2.0/
Disallow: /manual-2.2/
Disallow: /addon-modules/
Disallow: /doc/
Disallow: /images/
# exclude search results
Disallow: /hopper/searchresults
# exclude old version pages
Disallow: /cgi-bin/
Disallow: /Help/
Disallow: /cache/
Disallow: /Articles/
Disallow: /PR/
Disallow: /Texts/
Disallow: /index.html
Disallow: /Texts.html
Disallow: /art&arch.html
Disallow: /PerseusInfo.html
Disallow: /startingPoints.html
Disallow: /searches.html
Disallow: /lexica.html
Disallow: /newlatin.html
Disallow: /copyright.html
# the next line is a spam bot trap, for grepping the logs.
# you should _really_ change this to something else...
Disallow: /all_our_e-mail_addresses
# same idea here...
Disallow: /admin/

# but allow htdig to index our doc-tree
# (currently disabled; uncomment both lines to enable)
#User-agent: htdig
#Disallow:

# disallow stress test
User-agent: stress-agent
Disallow: /