Author: markus Date: Tue Sep 15 06:51:48 2015 New Revision: 1703111 URL: http://svn.apache.org/r1703111 Log: NUTCH-2093 Indexing filters to use current signatures
Modified: nutch/trunk/CHANGES.txt nutch/trunk/src/java/org/apache/nutch/indexer/IndexerMapReduce.java Modified: nutch/trunk/CHANGES.txt URL: http://svn.apache.org/viewvc/nutch/trunk/CHANGES.txt?rev=1703111&r1=1703110&r2=1703111&view=diff ============================================================================== --- nutch/trunk/CHANGES.txt (original) +++ nutch/trunk/CHANGES.txt Tue Sep 15 06:51:48 2015 @@ -2,6 +2,8 @@ Nutch Change Log Nutch Current Development 1.11-SNAPSHOT +* NUTCH-2093 Indexing filters to use current signatures (markus) + * NUTCH-2092: Unit Test for NutchServer (Sujen Shah via mattmann) * NUTCH-2096 Explicitly indicate browser binary to use when selecting Modified: nutch/trunk/src/java/org/apache/nutch/indexer/IndexerMapReduce.java URL: http://svn.apache.org/viewvc/nutch/trunk/src/java/org/apache/nutch/indexer/IndexerMapReduce.java?rev=1703111&r1=1703110&r2=1703111&view=diff ============================================================================== --- nutch/trunk/src/java/org/apache/nutch/indexer/IndexerMapReduce.java (original) +++ nutch/trunk/src/java/org/apache/nutch/indexer/IndexerMapReduce.java Tue Sep 15 06:51:48 2015 @@ -287,6 +287,9 @@ public class IndexerMapReduce extends Co final Parse parse = new ParseImpl(parseText, parseData); try { + // Indexing filters may also be interested in the signature + fetchDatum.setSignature(dbDatum.getSignature()); + // extract information from dbDatum and pass it to // fetchDatum so that indexing filters can use it final Text url = (Text) dbDatum.getMetaData().get(