Version 1 (modified by 14 years ago) (diff) | ,
---|
/etc/init.d/tomcat
is set to /usr/wwwapps/crawldir
http://today.java.net/pub/a/today/2006/01/10/introduction-to-nutch-1.html
http://today.java.net/pub/a/today/2006/02/16/introduction-to-nutch-2.html
http://www.folge2.de/tp/search/1/crawling-the-local-filesystem-with-nutch
In nutch-site.xml, add:
<property> <name>searcher.dir</name> <value>/usr/wwwapps/crawl_data/crawl</value> <description>Path to root of crawl</description> </property>
Recreate the crawl directory:
mkdir /usr/wwwapps/crawl_data/
mkdir urls
Create the seed file(s) in the urls directory and add the line:
file:///FILES/