Author: jnioche
Date: Sat Oct 20 09:14:40 2012
New Revision: 1400397
URL: http://svn.apache.org/viewvc?rev=1400397&view=rev
Log:
NUTCH-1433 Upgrade to Tika 1.2
Modified:
nutch/branches/2.x/CHANGES.txt
nutch/branches/2.x/ivy/ivy.xml
nutch/branches/2.x/src/plugin/parse-tika/ivy.xml
nutch/branches/2.x/src/plugin/parse-tika/plugin.xml
Modified: nutch/branches/2.x/CHANGES.txt
URL: http://svn.apache.org/viewvc/nutch/branches/2.x/CHANGES.txt?rev=1400397&r1=1400396&r2=1400397&view=diff
==============================================================================
--- nutch/branches/2.x/CHANGES.txt (original)
+++ nutch/branches/2.x/CHANGES.txt Sat Oct 20 09:14:40 2012
@@ -2,6 +2,8 @@ Nutch Change Log
Release 2.2 - Current Development
+* NUTCH-1433 Upgrade to Tika 1.2 (jnioche)
+
* NUTCH-1087 Deprecate crawl command and replace with example script (jnioche)
* NUTCH-874 Make sure all plugins in src/plugin are compatible with Nutch 2.0
and Gora (part 1) (Kiran Chitturi via lewismc)
Modified: nutch/branches/2.x/ivy/ivy.xml
URL: http://svn.apache.org/viewvc/nutch/branches/2.x/ivy/ivy.xml?rev=1400397&r1=1400396&r2=1400397&view=diff
==============================================================================
--- nutch/branches/2.x/ivy/ivy.xml (original)
+++ nutch/branches/2.x/ivy/ivy.xml Sat Oct 20 09:14:40 2012
@@ -58,10 +58,8 @@
</dependency>
<dependency org="com.ibm.icu" name="icu4j" rev="4.0.1" />
- <dependency org="org.apache.tika" name="tika-core" rev="1.1" />
- <!--
- <dependency org="org.apache.tika" name="tika-parsers" rev="0.10"/>
- -->
+ <dependency org="org.apache.tika" name="tika-core" rev="1.2" />
+ <dependency org="com.googlecode.juniversalchardet" name="juniversalchardet" rev="1.0.3"/>
<dependency org="org.apache.gora" name="gora-core" rev="0.2.1" conf="*->compile"/>
Modified: nutch/branches/2.x/src/plugin/parse-tika/ivy.xml
URL: http://svn.apache.org/viewvc/nutch/branches/2.x/src/plugin/parse-tika/ivy.xml?rev=1400397&r1=1400396&r2=1400397&view=diff
==============================================================================
--- nutch/branches/2.x/src/plugin/parse-tika/ivy.xml (original)
+++ nutch/branches/2.x/src/plugin/parse-tika/ivy.xml Sat Oct 20 09:14:40 2012
@@ -36,7 +36,7 @@
</publications>
<dependencies>
- <dependency org="org.apache.tika" name="tika-parsers" rev="0.10" conf="*->default">
+ <dependency org="org.apache.tika" name="tika-parsers" rev="1.2" conf="*->default">
<exclude org="org.apache.tika" name="tika-core" />
</dependency>
</dependencies>
Modified: nutch/branches/2.x/src/plugin/parse-tika/plugin.xml
URL: http://svn.apache.org/viewvc/nutch/branches/2.x/src/plugin/parse-tika/plugin.xml?rev=1400397&r1=1400396&r2=1400397&view=diff
==============================================================================
--- nutch/branches/2.x/src/plugin/parse-tika/plugin.xml (original)
+++ nutch/branches/2.x/src/plugin/parse-tika/plugin.xml Sat Oct 20 09:14:40 2012
@@ -26,33 +26,39 @@
<export name="*"/>
</library>
- <library name="apache-mime4j-core-0.7.jar"/>
- <library name="apache-mime4j-dom-0.7.jar"/>
+ <library name="apache-mime4j-core-0.7.2.jar"/>
+ <library name="apache-mime4j-dom-0.7.2.jar"/>
<library name="asm-3.1.jar"/>
+ <library name="aspectjrt-1.6.11.jar"/>
<library name="bcmail-jdk15-1.45.jar"/>
<library name="bcprov-jdk15-1.45.jar"/>
<library name="boilerpipe-1.1.0.jar"/>
- <library name="commons-codec-1.4.jar"/>
- <library name="commons-compress-1.1.jar"/>
- <library name="commons-httpclient-3.1.jar"/>
+ <library name="commons-codec-1.5.jar"/>
+ <library name="commons-compress-1.4.1.jar"/>
<library name="commons-logging-1.1.1.jar"/>
<library name="dom4j-1.6.1.jar"/>
- <library name="fontbox-1.6.0.jar"/>
+ <library name="fontbox-1.7.0.jar"/>
<library name="geronimo-stax-api_1.0_spec-1.0.1.jar"/>
+ <library name="isoparser-1.0-RC-1.jar"/>
<library name="jdom-1.0.jar"/>
- <library name="jempbox-1.6.0.jar"/>
+ <library name="jempbox-1.7.0.jar"/>
+ <library name="juniversalchardet-1.0.3.jar"/>
<library name="metadata-extractor-2.4.0-beta-1.jar"/>
<library name="netcdf-4.2-min.jar"/>
- <library name="pdfbox-1.6.0.jar"/>
- <library name="poi-3.8-beta4.jar"/>
- <library name="poi-ooxml-3.8-beta4.jar"/>
- <library name="poi-ooxml-schemas-3.8-beta4.jar"/>
- <library name="poi-scratchpad-3.8-beta4.jar"/>
+ <library name="parse-tika.jar"/>
+ <library name="pdfbox-1.7.0.jar"/>
+ <library name="poi-3.8.jar"/>
+ <library name="poi-ooxml-3.8.jar"/>
+ <library name="poi-ooxml-schemas-3.8.jar"/>
+ <library name="poi-scratchpad-3.8.jar"/>
<library name="rome-0.9.jar"/>
<library name="slf4j-api-1.5.6.jar"/>
<library name="tagsoup-1.2.1.jar"/>
- <library name="tika-parsers-0.10.jar"/>
+ <library name="tika-parsers-1.2.jar"/>
+ <library name="vorbis-java-core-0.1.jar"/>
+ <library name="vorbis-java-tika-0.1.jar"/>
<library name="xmlbeans-2.3.0.jar"/>
+ <library name="xz-1.0.jar"/>
</runtime>
<requires>