Author: snagel
Date: Mon Nov 16 20:29:33 2015
New Revision: 1714655

URL: http://svn.apache.org/viewvc?rev=1714655&view=rev
Log:
NUTCH-2130 copyField rawcontent creates error within schema.xml

Modified:
    nutch/branches/2.x/CHANGES.txt
    nutch/branches/2.x/conf/schema.xml

Modified: nutch/branches/2.x/CHANGES.txt
URL: http://svn.apache.org/viewvc/nutch/branches/2.x/CHANGES.txt?rev=1714655&r1=1714654&r2=1714655&view=diff
==============================================================================
--- nutch/branches/2.x/CHANGES.txt (original)
+++ nutch/branches/2.x/CHANGES.txt Mon Nov 16 20:29:33 2015
@@ -3,6 +3,8 @@ Nutch Change Log
 Nutch 2.3.1 Release 22092015 (ddmmyyyy)
 Release Report - http://s.apache.org/nutch_2.3.1
 
+* NUTCH-2130 copyField rawcontent creates error within schema.xml (Sherban Drulea, lewismc, snagel)
+
 * NUTCH-2018 Ensure that the Docker containers for Nutch 2.X are part of the Release Management Documentation (lewismc)
 
 * NUTCH-2105 Update Nutch Cassandra Dockerfile to work with Gora Nutch 2.3.1 (lewismc)

Modified: nutch/branches/2.x/conf/schema.xml
URL: http://svn.apache.org/viewvc/nutch/branches/2.x/conf/schema.xml?rev=1714655&r1=1714654&r2=1714655&view=diff
==============================================================================
--- nutch/branches/2.x/conf/schema.xml (original)
+++ nutch/branches/2.x/conf/schema.xml Mon Nov 16 20:29:33 2015
@@ -32,6 +32,7 @@
     <!-- The StrField type is not analyzed, but indexed/stored verbatim. -->
     <fieldType name="string" class="solr.StrField" sortMissingLast="true" omitNorms="true"/>
 
+    <fieldtype name="binary" class="solr.BinaryField"/>
 
     <!--
       Default numeric field types. For faster range queries, consider the tint/tfloat/tlong/tdouble types.
@@ -357,6 +358,12 @@
 
     <!-- fields for tld plugin -->    
     <field name="tld" type="string" stored="false" indexed="false"/>
+
+    <!-- fields for index-html plugin
+         Note: although raw document content may be binary,
+               index-html adds a String to the index field -->
+    <field name="rawcontent" type="string" stored="true" indexed="false"/>
+
  </fields>
  <uniqueKey>id</uniqueKey>
  <defaultSearchField>text</defaultSearchField>
@@ -367,7 +374,6 @@
         or to add multiple fields to the same field for easier/faster searching.  -->
 
  <copyField source="content" dest="text"/>
- <copyField source="rawcontent" dest="text"/>
  <copyField source="url" dest="text"/>
  <copyField source="title" dest="text"/>
  <copyField source="anchor" dest="text"/>


Reply via email to