[Yanel-commits] rev 26472 -
public/yanel/trunk/src/realms/yanel-website/content/nutch-config
michi at wyona.com
michi at wyona.com
Thu Aug 2 14:12:36 CEST 2007
Author: michi
Date: 2007-08-02 14:12:36 +0200 (Thu, 02 Aug 2007)
New Revision: 26472
Added:
public/yanel/trunk/src/realms/yanel-website/content/nutch-config/nutch-local-yanel-ml-usage.xml
Log:
usage config added
Added: public/yanel/trunk/src/realms/yanel-website/content/nutch-config/nutch-local-yanel-ml-usage.xml
===================================================================
--- public/yanel/trunk/src/realms/yanel-website/content/nutch-config/nutch-local-yanel-ml-usage.xml (rev 0)
+++ public/yanel/trunk/src/realms/yanel-website/content/nutch-config/nutch-local-yanel-ml-usage.xml 2007-08-02 12:12:36 UTC (rev 26472)
@@ -0,0 +1,24 @@
+<?xml version="1.0"?>
+
+<configuration>
+
+ <property>
+ <name>searcher.dir</name>
+<!--
+ <value>/home/ulysses/src/crawl_yanel_mailing-lists_usage_dev_20070113</value>
+-->
+ <value>/home/michi/src/wyona/extra/ipi/nutch/trunk/crawl_yanel_ml_usage_2007.08.02</value>
+ <description>
+ Path to root of crawl. This directory is searched (in
+ order) for either the file search-servers.txt, containing a list of
+ distributed search servers, or the directory "index" containing
+ merged indexes, or the directory "segments" containing segment
+ indexes.
+ </description>
+ </property>
+
+ <property>
+ <name>plugin.includes</name>
+ <value>nutch-extensionpoints|protocol-file|protocol-http|ontology|languageidentifier|analysis-(fr|en|de)|urlfilter-regex|parse-(text|pdf|mspowerpoint|msword|msexcel|rtf|rss|html|zip)|index-basic|query-(basic|site|url)|lib-jakarta-poi|lib-lucene-analyzers|scoring-opic</value>
+ </property>
+</configuration>
More information about the Yanel-commits
mailing list