Author: jnioche
Date: Mon Nov 18 12:08:45 2013
New Revision: 1543010
URL: http://svn.apache.org/r1543010
Log:
NUTCH-1668 Remove package org.apache.nutch.indexer.solr
Removed:
nutch/trunk/src/java/org/apache/nutch/indexer/solr/
Modified:
nutch/trunk/CHANGES.txt
nutch/trunk/ivy/ivy.xml
nutch/trunk/src/bin/nutch
nutch/trunk/src/java/org/apache/nutch/indexer/IndexingJob.java
Modified: nutch/trunk/CHANGES.txt
URL:
http://svn.apache.org/viewvc/nutch/trunk/CHANGES.txt?rev=1543010&r1=1543009&r2=1543010&view=diff
==============================================================================
--- nutch/trunk/CHANGES.txt (original)
+++ nutch/trunk/CHANGES.txt Mon Nov 18 12:08:45 2013
@@ -2,6 +2,8 @@ Nutch Change Log
Nutch Development Trunk
+* NUTCH-1668 Remove package org.apache.nutch.indexer.solr (jnioche)
+
* NUTCH-1621 Remove deprecated class o.a.n.crawl.Crawler (Rui Gao via jnioche)
* NUTCH-656 Generic Deduplicator (jnioche, snagel)
Modified: nutch/trunk/ivy/ivy.xml
URL:
http://svn.apache.org/viewvc/nutch/trunk/ivy/ivy.xml?rev=1543010&r1=1543009&r2=1543010&view=diff
==============================================================================
--- nutch/trunk/ivy/ivy.xml (original)
+++ nutch/trunk/ivy/ivy.xml Mon Nov 18 12:08:45 2013
@@ -34,11 +34,8 @@
</publications>
<dependencies>
- <dependency org="org.elasticsearch" name="elasticsearch" rev="0.90.1"
- conf="*->default"/>
-
- <dependency org="org.apache.solr" name="solr-solrj" rev="3.4.0"
- conf="*->default" />
+ <dependency org="org.elasticsearch" name="elasticsearch"
+ rev="0.90.1" conf="*->default" />
<dependency org="org.slf4j" name="slf4j-api" rev="1.6.1"
conf="*->master" />
@@ -77,7 +74,8 @@
<dependency org="oro" name="oro" rev="2.0.8" />
<dependency org="com.google.guava" name="guava" rev="11.0.2" />
- <dependency org="com.google.code.crawler-commons" name="crawler-commons" rev="0.2" />
+ <dependency org="com.google.code.crawler-commons" name="crawler-commons"
+ rev="0.2" />
<!--Configuration: test -->
Modified: nutch/trunk/src/bin/nutch
URL:
http://svn.apache.org/viewvc/nutch/trunk/src/bin/nutch?rev=1543010&r1=1543009&r2=1543010&view=diff
==============================================================================
--- nutch/trunk/src/bin/nutch (original)
+++ nutch/trunk/src/bin/nutch Mon Nov 18 12:08:45 2013
@@ -61,10 +61,11 @@ if [ $# = 0 ]; then
echo " invertlinks create a linkdb from parsed segments"
echo " mergelinkdb merge linkdb-s, with optional filtering"
echo " index run the plugin-based indexer on parsed segments and linkdb"
- echo " solrindex run the solr indexer on parsed segments and linkdb"
- echo " solrdedup remove duplicates from solr"
- echo " solrclean remove HTTP 301 and 404 documents from solr"
- echo " clean remove HTTP 301 and 404 documents from indexing backends configured via plugins"
+ echo " dedup deduplicate entries in the crawldb and give them a special status"
+ echo " solrindex run the solr indexer on parsed segments and linkdb - DEPRECATED use the index command instead"
+ echo " solrdedup remove duplicates from solr - DEPRECATED use the dedup command instead"
+ echo " solrclean remove HTTP 301 and 404 documents from solr - DEPRECATED use the clean command instead"
+ echo " clean remove HTTP 301 and 404 documents and duplicates from indexing backends configured via plugins"
echo " parsechecker check the parser for a given url"
echo " indexchecker check the indexing filters for a given url"
echo " domainstats calculate domain statistics from crawldb"
@@ -226,7 +227,8 @@ elif [ "$COMMAND" = "solrindex" ] ; then
elif [ "$COMMAND" = "index" ] ; then
CLASS=org.apache.nutch.indexer.IndexingJob
elif [ "$COMMAND" = "solrdedup" ] ; then
- CLASS=org.apache.nutch.indexer.solr.SolrDeleteDuplicates
+ echo "Command $COMMAND is deprecated, please use dedup instead"
+ exit -1
elif [ "$COMMAND" = "dedup" ] ; then
CLASS=org.apache.nutch.crawl.DeduplicationJob
elif [ "$COMMAND" = "solrclean" ] ; then
Modified: nutch/trunk/src/java/org/apache/nutch/indexer/IndexingJob.java
URL:
http://svn.apache.org/viewvc/nutch/trunk/src/java/org/apache/nutch/indexer/IndexingJob.java?rev=1543010&r1=1543009&r2=1543010&view=diff
==============================================================================
--- nutch/trunk/src/java/org/apache/nutch/indexer/IndexingJob.java (original)
+++ nutch/trunk/src/java/org/apache/nutch/indexer/IndexingJob.java Mon Nov 18 12:08:45 2013
@@ -33,7 +33,6 @@ import org.apache.hadoop.mapred.JobConf;
import org.apache.hadoop.util.StringUtils;
import org.apache.hadoop.util.Tool;
import org.apache.hadoop.util.ToolRunner;
-import org.apache.nutch.indexer.solr.SolrConstants;
import org.apache.nutch.util.HadoopFSUtil;
import org.apache.nutch.util.NutchConfiguration;
import org.apache.nutch.util.NutchJob;
@@ -57,14 +56,6 @@ public class IndexingJob extends Configu
super(conf);
}
- public void index(Path crawlDb, Path linkDb, List<Path> segments)
- throws IOException {
- // SOLR SPECIFIC COMMIT PARAM USED BY CRAWL CLASS
- boolean noCommit = !getConf().getBoolean(SolrConstants.COMMIT_INDEX,
- true);
- index(crawlDb, linkDb, segments, noCommit, false, null);
- }
-
public void index(Path crawlDb, Path linkDb, List<Path> segments,
boolean noCommit) throws IOException {
index(crawlDb, linkDb, segments, noCommit, false, null);