[Yanel-commits] rev 26472 - public/yanel/trunk/src/realms/yanel-website/content/nutch-config

michi at wyona.com michi at wyona.com
Thu Aug 2 14:12:36 CEST 2007


Author: michi
Date: 2007-08-02 14:12:36 +0200 (Thu, 02 Aug 2007)
New Revision: 26472

Added:
   public/yanel/trunk/src/realms/yanel-website/content/nutch-config/nutch-local-yanel-ml-usage.xml
Log:
Added local Nutch configuration for the Yanel "usage" mailing-list crawl

Added: public/yanel/trunk/src/realms/yanel-website/content/nutch-config/nutch-local-yanel-ml-usage.xml
===================================================================
--- public/yanel/trunk/src/realms/yanel-website/content/nutch-config/nutch-local-yanel-ml-usage.xml	                        (rev 0)
+++ public/yanel/trunk/src/realms/yanel-website/content/nutch-config/nutch-local-yanel-ml-usage.xml	2007-08-02 12:12:36 UTC (rev 26472)
@@ -0,0 +1,24 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!-- Local Nutch configuration for the Yanel "usage" mailing-list crawl. -->
+<configuration>
+  <!-- Root directory of the crawl; the value is an absolute path on the local machine. -->
+  <property>
+    <name>searcher.dir</name>
+    <!-- Alternative crawl location, kept for reference:
+    <value>/home/ulysses/src/crawl_yanel_mailing-lists_usage_dev_20070113</value>
+    -->
+    <value>/home/michi/src/wyona/extra/ipi/nutch/trunk/crawl_yanel_ml_usage_2007.08.02</value>
+    <description>
+    Path to root of crawl.  This directory is searched (in
+    order) for either the file search-servers.txt, containing a list of
+    distributed search servers, or the directory "index" containing
+    merged indexes, or the directory "segments" containing segment
+    indexes.
+    </description>
+  </property>
+  <!-- Plugins to enable, written as '|'-separated alternatives (presumably a regular expression; confirm against nutch-default.xml). -->
+  <property>
+    <name>plugin.includes</name>
+    <value>nutch-extensionpoints|protocol-file|protocol-http|ontology|languageidentifier|analysis-(fr|en|de)|urlfilter-regex|parse-(text|pdf|mspowerpoint|msword|msexcel|rtf|rss|html|zip)|index-basic|query-(basic|site|url)|lib-jakarta-poi|lib-lucene-analyzers|scoring-opic</value>
+  </property>
+</configuration>



More information about the Yanel-commits mailing list