app/soc/content/robots.txt
author Sverre Rabbelier <sverre@rabbelier.nl>
Mon, 25 May 2009 23:40:07 +0200
changeset 2346 d830123c1be1
parent 73 211a3eeacf27
permissions -rw-r--r--
Do not die on NeedIndexErrors

# Directions for web crawlers.
# See http://www.robotstxt.org/wc/norobots.html.

# Single exclusion record: the four user agents named below share the one
# rule that follows them. "Disallow: /" matches every path, so these agents
# are asked not to fetch anything from this site.
# NOTE(review): the listed agents look like bulk-download / mirroring
# clients -- confirm the intent with the site owners.
# No "User-agent: *" record is visible here, so any crawler not named in
# this record is left unrestricted.
# Keep the record contiguous: a blank line between these lines would end
# the record and detach the User-agent lines from the Disallow rule.
User-agent: HTTrack
User-agent: puf
User-agent: MSIECrawler
User-agent: Nutch
Disallow: /