This is an automated email from the ASF dual-hosted git repository.

lewismc pushed a commit to branch master
in repository https://gitbox.apache.org/repos/asf/nutch.git


The following commit(s) were added to refs/heads/master by this push:
     new 5250d62  NUTCH-2851 Random object created and used only once (#571)
5250d62 is described below

commit 5250d62986468b23509a82d2aaa32bdc11cf02a8
Author: Lewis John McGibbney <lewis.mcgibb...@gmail.com>
AuthorDate: Thu Feb 18 07:20:59 2021 -0800

    NUTCH-2851 Random object created and used only once (#571)
---
 src/java/org/apache/nutch/crawl/Generator.java       | 5 +++--
 src/java/org/apache/nutch/indexer/IndexingJob.java   | 4 +++-
 src/java/org/apache/nutch/segment/SegmentReader.java | 5 ++++-
 src/java/org/apache/nutch/tools/DmozParser.java      | 5 ++++-
 4 files changed, 14 insertions(+), 5 deletions(-)

diff --git a/src/java/org/apache/nutch/crawl/Generator.java b/src/java/org/apache/nutch/crawl/Generator.java
index dcba9bf..00eb18f 100644
--- a/src/java/org/apache/nutch/crawl/Generator.java
+++ b/src/java/org/apache/nutch/crawl/Generator.java
@@ -35,7 +35,6 @@ import org.apache.hadoop.conf.Configurable;
 import org.slf4j.Logger;
 import org.slf4j.LoggerFactory;
 import org.apache.commons.jexl3.JexlExpression;
-import org.antlr.v4.parse.ANTLRParser.throwsSpec_return;
 import org.apache.commons.jexl3.JexlContext;
 import org.apache.commons.jexl3.MapContext;
 import org.apache.hadoop.mapreduce.Counter;
@@ -90,6 +89,8 @@ import org.apache.nutch.util.URLUtil;
  **/
 public class Generator extends NutchTool implements Tool {
 
+  private static final Random RANDOM = new Random();
+
   protected static final Logger LOG = LoggerFactory
       .getLogger(MethodHandles.lookup().lookupClass());
 
@@ -1013,7 +1014,7 @@ public class Generator extends NutchTool implements Tool {
     Job job = NutchJob.getInstance(getConf());
     job.setJobName("generate: partition " + segment);
     Configuration conf = job.getConfiguration();
-    conf.setInt("partition.url.seed", new Random().nextInt());
+    conf.setInt("partition.url.seed", RANDOM.nextInt());
 
     FileInputFormat.addInputPath(job, inputDir);
     job.setInputFormatClass(SequenceFileInputFormat.class);
diff --git a/src/java/org/apache/nutch/indexer/IndexingJob.java b/src/java/org/apache/nutch/indexer/IndexingJob.java
index 0966276..0fe29a7 100644
--- a/src/java/org/apache/nutch/indexer/IndexingJob.java
+++ b/src/java/org/apache/nutch/indexer/IndexingJob.java
@@ -54,6 +54,8 @@ import org.slf4j.LoggerFactory;
 
 public class IndexingJob extends NutchTool implements Tool {
 
+  private static final Random RANDOM = new Random();
+
   private static final Logger LOG = LoggerFactory
       .getLogger(MethodHandles.lookup().lookupClass());
 
@@ -136,7 +138,7 @@ public class IndexingJob extends NutchTool implements Tool {
     job.setReduceSpeculativeExecution(false);
 
     final Path tmp = new Path("tmp_" + System.currentTimeMillis() + "-"
-        + new Random().nextInt());
+        + RANDOM.nextInt());
 
     FileOutputFormat.setOutputPath(job, tmp);
     try {
diff --git a/src/java/org/apache/nutch/segment/SegmentReader.java b/src/java/org/apache/nutch/segment/SegmentReader.java
index 284daed..2f2fefd 100644
--- a/src/java/org/apache/nutch/segment/SegmentReader.java
+++ b/src/java/org/apache/nutch/segment/SegmentReader.java
@@ -35,6 +35,7 @@ import java.util.HashMap;
 import java.util.Iterator;
 import java.util.List;
 import java.util.Map;
+import java.util.Random;
 
 import org.slf4j.Logger;
 import org.slf4j.LoggerFactory;
@@ -74,6 +75,8 @@ import org.apache.nutch.util.SegmentReaderUtil;
 /** Dump the content of a segment. */
 public class SegmentReader extends Configured implements Tool {
 
+  private static final Random RANDOM = new Random();
+
   private static final Logger LOG = LoggerFactory
       .getLogger(MethodHandles.lookup().lookupClass());
 
@@ -220,7 +223,7 @@ public class SegmentReader extends Configured implements Tool {
     job.setJarByClass(SegmentReader.class);
 
     Path tempDir = new Path(conf.get("hadoop.tmp.dir", "/tmp") + "/segread-"
-        + new java.util.Random().nextInt());
+        + RANDOM.nextInt());
     FileSystem fs = tempDir.getFileSystem(conf);
     fs.delete(tempDir, true);
 
diff --git a/src/java/org/apache/nutch/tools/DmozParser.java b/src/java/org/apache/nutch/tools/DmozParser.java
index b68facb..8db4817 100644
--- a/src/java/org/apache/nutch/tools/DmozParser.java
+++ b/src/java/org/apache/nutch/tools/DmozParser.java
@@ -54,6 +54,9 @@ import org.apache.nutch.util.NutchConfiguration;
  * RDF into a flat file of URLs to be injected. 
  */
 public class DmozParser {
+
+  private static final Random RANDOM = new Random();
+
   private static final Logger LOG = LoggerFactory
       .getLogger(MethodHandles.lookup().lookupClass());
 
@@ -134,7 +137,7 @@ public class DmozParser {
       this.includeAdult = includeAdult;
       this.topicPattern = topicPattern;
 
-      this.hashSkew = skew != 0 ? skew : new Random().nextInt();
+      this.hashSkew = skew != 0 ? skew : RANDOM.nextInt();
     }
 
     //

Reply via email to