Author: markus
Date: Mon Jan 2 13:16:59 2012
New Revision: 1226409
URL: http://svn.apache.org/viewvc?rev=1226409&view=rev
Log:
NUTCH-1232 Remove site field from index-basic
Modified:
nutch/trunk/CHANGES.txt
nutch/trunk/conf/schema-solr4.xml
nutch/trunk/conf/schema.xml
nutch/trunk/conf/solrindex-mapping.xml
nutch/trunk/src/plugin/index-basic/src/java/org/apache/nutch/indexer/basic/BasicIndexingFilter.java
Modified: nutch/trunk/CHANGES.txt
URL:
http://svn.apache.org/viewvc/nutch/trunk/CHANGES.txt?rev=1226409&r1=1226408&r2=1226409&view=diff
==============================================================================
--- nutch/trunk/CHANGES.txt (original)
+++ nutch/trunk/CHANGES.txt Mon Jan 2 13:16:59 2012
@@ -1,5 +1,7 @@
Nutch Change Log
+* NUTCH-1232 Remove site field from index-basic (markus)
+
* NUTCH-1239 Webgraph should remove deleted pages from segment input (markus)
* NUTCH-1238 Fetcher throughput threshold must start before feeder finished
(markus)
Modified: nutch/trunk/conf/schema-solr4.xml
URL:
http://svn.apache.org/viewvc/nutch/trunk/conf/schema-solr4.xml?rev=1226409&r1=1226408&r2=1226409&view=diff
==============================================================================
--- nutch/trunk/conf/schema-solr4.xml (original)
+++ nutch/trunk/conf/schema-solr4.xml Mon Jan 2 13:16:59 2012
@@ -310,7 +310,6 @@
<!-- fields for index-basic plugin -->
<field name="host" type="url" stored="false" indexed="true"/>
- <field name="site" type="string" stored="false" indexed="true"/>
<field name="url" type="url" stored="true" indexed="true" required="true"/>
<!-- stored=true for highlighting, use term vectors and positions for
fast highlighting -->
<field name="content" type="text_general" stored="true" indexed="true"/>
Modified: nutch/trunk/conf/schema.xml
URL:
http://svn.apache.org/viewvc/nutch/trunk/conf/schema.xml?rev=1226409&r1=1226408&r2=1226409&view=diff
==============================================================================
--- nutch/trunk/conf/schema.xml (original)
+++ nutch/trunk/conf/schema.xml Mon Jan 2 13:16:59 2012
@@ -22,6 +22,7 @@
https://issues.apache.org/jira/browse/NUTCH-994
https://issues.apache.org/jira/browse/NUTCH-997
https://issues.apache.org/jira/browse/NUTCH-1058
+ https://issues.apache.org/jira/browse/NUTCH-1232
and
http://svn.apache.org/viewvc/lucene/dev/branches/branch_3x/solr/
example/solr/conf/schema.xml?view=markup
@@ -73,8 +74,7 @@
<field name="boost" type="float" stored="true" indexed="false"/>
<!-- fields for index-basic plugin -->
- <field name="host" type="url" stored="false" indexed="true"/>
- <field name="site" type="string" stored="false" indexed="true"/>
+ <field name="host" type="string" stored="false" indexed="true"/>
<field name="url" type="url" stored="true" indexed="true"
required="true"/>
<field name="content" type="text" stored="false" indexed="true"/>
Modified: nutch/trunk/conf/solrindex-mapping.xml
URL:
http://svn.apache.org/viewvc/nutch/trunk/conf/solrindex-mapping.xml?rev=1226409&r1=1226408&r2=1226409&view=diff
==============================================================================
--- nutch/trunk/conf/solrindex-mapping.xml (original)
+++ nutch/trunk/conf/solrindex-mapping.xml Mon Jan 2 13:16:59 2012
@@ -32,7 +32,6 @@
-->
<fields>
<field dest="content" source="content"/>
- <field dest="site" source="site"/>
<field dest="title" source="title"/>
<field dest="host" source="host"/>
<field dest="segment" source="segment"/>
Modified:
nutch/trunk/src/plugin/index-basic/src/java/org/apache/nutch/indexer/basic/BasicIndexingFilter.java
URL:
http://svn.apache.org/viewvc/nutch/trunk/src/plugin/index-basic/src/java/org/apache/nutch/indexer/basic/BasicIndexingFilter.java?rev=1226409&r1=1226408&r2=1226409&view=diff
==============================================================================
---
nutch/trunk/src/plugin/index-basic/src/java/org/apache/nutch/indexer/basic/BasicIndexingFilter.java
(original)
+++
nutch/trunk/src/plugin/index-basic/src/java/org/apache/nutch/indexer/basic/BasicIndexingFilter.java
Mon Jan 2 13:16:59 2012
@@ -67,7 +67,6 @@ public class BasicIndexingFilter impleme
if (host != null) {
doc.add("host", host);
- doc.add("site", host);
}
doc.add("url", reprUrlString == null ? urlString : reprUrlString);