This is an automated email from the ASF dual-hosted git repository.
tallison pushed a commit to branch master
in repository https://gitbox.apache.org/repos/asf/nutch.git
The following commit(s) were added to refs/heads/master by this push:
new f88b9a116 NUTCH-3019 -- update Tika (#797)
f88b9a116 is described below
commit f88b9a116d6be5eea738d99af65406bdd96fd6d0
Author: Tim Allison <[email protected]>
AuthorDate: Mon Nov 6 12:10:43 2023 -0500
NUTCH-3019 -- update Tika (#797)
Update to Tika 2.9.1
---
ivy/ivy.xml | 14 ++++++++------
src/plugin/language-identifier/ivy.xml | 2 +-
src/plugin/language-identifier/plugin.xml | 2 +-
src/plugin/parse-tika/ivy.xml | 2 +-
src/plugin/parse-tika/plugin.xml | 2 +-
5 files changed, 12 insertions(+), 10 deletions(-)
diff --git a/ivy/ivy.xml b/ivy/ivy.xml
index e5ae3882f..054cbcc1a 100644
--- a/ivy/ivy.xml
+++ b/ivy/ivy.xml
@@ -36,19 +36,21 @@
</publications>
<dependencies>
- <dependency org="org.apache.logging.log4j" name="log4j-api"
rev="2.20.0" conf="*->master" />
- <dependency org="org.apache.logging.log4j" name="log4j-core" rev="2.20.0"
conf="*->master" />
- <dependency org="org.apache.logging.log4j"
name="log4j-slf4j2-impl" rev="2.20.0" conf="*->master" />
- <dependency org="org.slf4j" name="slf4j-api" rev="2.0.7"
conf="*->master" />
+ <dependency org="org.apache.logging.log4j" name="log4j-api"
rev="2.21.1" conf="*->master" />
+ <dependency org="org.apache.logging.log4j" name="log4j-core" rev="2.21.1"
conf="*->master" />
+ <dependency org="org.apache.logging.log4j"
name="log4j-slf4j2-impl" rev="2.21.1" conf="*->master" />
+ <dependency org="org.slf4j" name="slf4j-api" rev="2.0.9"
conf="*->master" />
<dependency org="org.apache.commons" name="commons-lang3"
rev="3.13.0" conf="*->default" />
<dependency org="org.apache.commons"
name="commons-collections4" rev="4.4" conf="*->master" />
<dependency org="org.apache.httpcomponents" name="httpclient"
rev="4.5.13" conf="*->master" />
<dependency org="commons-codec" name="commons-codec"
rev="1.16.0" conf="*->default" />
<!-- hadoop 3.4.0 should have 2.11.0; Tika is broken in
distributed mode until then;
+ We're currently relying on the hadoop-safe-tika
shim that shades commons-io to upgrade
+ Tika
see https://github.com/apache/nutch/pull/776 -->
<dependency org="commons-io" name="commons-io" rev="2.11.0"
conf="*->default" />
- <dependency org="org.apache.commons" name="commons-compress"
rev="1.23.0" conf="*->default" />
+ <dependency org="org.apache.commons" name="commons-compress"
rev="1.24.0" conf="*->default" />
<dependency org="org.apache.commons" name="commons-jexl3"
rev="3.2.1" conf="*->default" />
<dependency org="com.tdunning" name="t-digest" rev="3.3" />
@@ -70,7 +72,7 @@
<exclude org="org.slf4j" name="*" />
</dependency><!-- End of Hadoop Dependencies -->
- <dependency org="org.tallison.tika" name="tika-core-shaded"
rev="2.9.0.0" conf="*->default" transitive="false"/>
+ <dependency org="org.tallison.tika" name="tika-core-shaded"
rev="2.9.1.0" conf="*->default" transitive="false"/>
<dependency org="xml-apis" name="xml-apis" rev="1.4.01" /><!--
force this version as it is required by Tika -->
<dependency org="xerces" name="xercesImpl" rev="2.12.2" />
diff --git a/src/plugin/language-identifier/ivy.xml b/src/plugin/language-identifier/ivy.xml
index f64b97055..e22284c03 100644
--- a/src/plugin/language-identifier/ivy.xml
+++ b/src/plugin/language-identifier/ivy.xml
@@ -35,7 +35,7 @@
</publications>
<dependencies>
- <dependency org="org.tallison.tika"
name="tika-langdetect-optimaize-shaded" rev="2.9.0.0" conf="*->default"
transitive="false"/>
+ <dependency org="org.tallison.tika"
name="tika-langdetect-optimaize-shaded" rev="2.9.1.0" conf="*->default"
transitive="false"/>
</dependencies>
</ivy-module>
diff --git a/src/plugin/language-identifier/plugin.xml b/src/plugin/language-identifier/plugin.xml
index dab1a52f3..94929bdbf 100644
--- a/src/plugin/language-identifier/plugin.xml
+++ b/src/plugin/language-identifier/plugin.xml
@@ -26,7 +26,7 @@
<export name="*"/>
</library>
<!-- dependencies of Tika's Optimaize language detector
(tika-langdetect-optimaize) -->
- <library name="tika-langdetect-optimaize-shaded-2.9.0.0.jar"/>
+ <library name="tika-langdetect-optimaize-shaded-2.9.1.0.jar"/>
</runtime>
<requires>
diff --git a/src/plugin/parse-tika/ivy.xml b/src/plugin/parse-tika/ivy.xml
index b89e812e1..8008e3244 100644
--- a/src/plugin/parse-tika/ivy.xml
+++ b/src/plugin/parse-tika/ivy.xml
@@ -35,7 +35,7 @@
</publications>
<dependencies>
- <dependency org="org.tallison.tika"
name="tika-parsers-standard-package-shaded" rev="2.9.0.0" conf="*->default"
transitive="false"/>
+ <dependency org="org.tallison.tika"
name="tika-parsers-standard-package-shaded" rev="2.9.1.0" conf="*->default"
transitive="false"/>
</dependencies>
</ivy-module>
diff --git a/src/plugin/parse-tika/plugin.xml b/src/plugin/parse-tika/plugin.xml
index dd4fe7fde..04afb9fac 100644
--- a/src/plugin/parse-tika/plugin.xml
+++ b/src/plugin/parse-tika/plugin.xml
@@ -25,7 +25,7 @@
<library name="parse-tika.jar">
<export name="*"/>
</library>
- <library name="tika-parsers-standard-package-shaded-2.9.0.0.jar"/>
+ <library name="tika-parsers-standard-package-shaded-2.9.1.0.jar"/>
</runtime>
<requires>