Author: lewismc
Date: Thu Jul 31 01:22:58 2014
New Revision: 1614801
URL: http://svn.apache.org/r1614801
Log:
NUTCH-1819 Check for batchId input in GeneratorJob#run
Modified:
nutch/branches/2.x/CHANGES.txt
nutch/branches/2.x/src/java/org/apache/nutch/crawl/GeneratorJob.java
Modified: nutch/branches/2.x/CHANGES.txt
URL:
http://svn.apache.org/viewvc/nutch/branches/2.x/CHANGES.txt?rev=1614801&r1=1614800&r2=1614801&view=diff
==============================================================================
--- nutch/branches/2.x/CHANGES.txt (original)
+++ nutch/branches/2.x/CHANGES.txt Thu Jul 31 01:22:58 2014
@@ -2,6 +2,8 @@ Nutch Change Log
Current Development
+* NUTCH-1819 batchId in GeneratorJob ( Fjodor Vershinin via lewismc)
+
* NUTCH-1708 use same id when indexing and deleting redirects (snagel)
* NUTCH-1817 Remove pom.xml from source (jnioche)
Modified: nutch/branches/2.x/src/java/org/apache/nutch/crawl/GeneratorJob.java
URL:
http://svn.apache.org/viewvc/nutch/branches/2.x/src/java/org/apache/nutch/crawl/GeneratorJob.java?rev=1614801&r1=1614800&r2=1614801&view=diff
==============================================================================
--- nutch/branches/2.x/src/java/org/apache/nutch/crawl/GeneratorJob.java (original)
+++ nutch/branches/2.x/src/java/org/apache/nutch/crawl/GeneratorJob.java Thu Jul 31 01:22:58 2014
@@ -161,6 +161,11 @@ public class GeneratorJob extends NutchT
}
public Map<String,Object> run(Map<String,Object> args) throws Exception {
+ String batchId = (String)args.get(Nutch.ARG_BATCH);
+ if (batchId != null) {
+ getConf().set(GeneratorJob.BATCH_ID, batchId);
+ }
+
// map to inverted subset due for fetch, sort by score
Long topN = (Long)args.get(Nutch.ARG_TOPN);
Long curTime = (Long)args.get(Nutch.ARG_CURTIME);