This is an automated email from the ASF dual-hosted git repository.

tallison pushed a commit to branch master
in repository https://gitbox.apache.org/repos/asf/nutch.git
The following commit(s) were added to refs/heads/master by this push:
     new f88b9a116 NUTCH-3019 -- update Tika (#797)
f88b9a116 is described below

commit f88b9a116d6be5eea738d99af65406bdd96fd6d0
Author: Tim Allison <talli...@apache.org>
AuthorDate: Mon Nov 6 12:10:43 2023 -0500

    NUTCH-3019 -- update Tika (#797)

    Update to Tika 2.9.1
---
 ivy/ivy.xml                               | 14 ++++++++------
 src/plugin/language-identifier/ivy.xml    |  2 +-
 src/plugin/language-identifier/plugin.xml |  2 +-
 src/plugin/parse-tika/ivy.xml             |  2 +-
 src/plugin/parse-tika/plugin.xml          |  2 +-
 5 files changed, 12 insertions(+), 10 deletions(-)

diff --git a/ivy/ivy.xml b/ivy/ivy.xml
index e5ae3882f..054cbcc1a 100644
--- a/ivy/ivy.xml
+++ b/ivy/ivy.xml
@@ -36,19 +36,21 @@
 </publications>
 <dependencies>
- <dependency org="org.apache.logging.log4j" name="log4j-api" rev="2.20.0" conf="*->master" />
- <dependency org="org.apache.logging.log4j" name="log4j-core" rev="2.20.0" conf="*->master" />
- <dependency org="org.apache.logging.log4j" name="log4j-slf4j2-impl" rev="2.20.0" conf="*->master" />
- <dependency org="org.slf4j" name="slf4j-api" rev="2.0.7" conf="*->master" />
+ <dependency org="org.apache.logging.log4j" name="log4j-api" rev="2.21.1" conf="*->master" />
+ <dependency org="org.apache.logging.log4j" name="log4j-core" rev="2.21.1" conf="*->master" />
+ <dependency org="org.apache.logging.log4j" name="log4j-slf4j2-impl" rev="2.21.1" conf="*->master" />
+ <dependency org="org.slf4j" name="slf4j-api" rev="2.0.9" conf="*->master" />
 <dependency org="org.apache.commons" name="commons-lang3" rev="3.13.0" conf="*->default" />
 <dependency org="org.apache.commons" name="commons-collections4" rev="4.4" conf="*->master" />
 <dependency org="org.apache.httpcomponents" name="httpclient" rev="4.5.13" conf="*->master" />
 <dependency org="commons-codec" name="commons-codec" rev="1.16.0" conf="*->default" />
 <!-- hadoop 3.4.0 should have 2.11.0; Tika is broken in distributed mode until then;
+ We're currently relying on the hadoop-safe-tika shim that shades commons-io to upgrade
+ Tika see https://github.com/apache/nutch/pull/776
 -->
 <dependency org="commons-io" name="commons-io" rev="2.11.0" conf="*->default" />
- <dependency org="org.apache.commons" name="commons-compress" rev="1.23.0" conf="*->default" />
+ <dependency org="org.apache.commons" name="commons-compress" rev="1.24.0" conf="*->default" />
 <dependency org="org.apache.commons" name="commons-jexl3" rev="3.2.1" conf="*->default" />
 <dependency org="com.tdunning" name="t-digest" rev="3.3" />
@@ -70,7 +72,7 @@
 <exclude org="org.slf4j" name="*" />
 </dependency><!-- End of Hadoop Dependencies -->
- <dependency org="org.tallison.tika" name="tika-core-shaded" rev="2.9.0.0" conf="*->default" transitive="false"/>
+ <dependency org="org.tallison.tika" name="tika-core-shaded" rev="2.9.1.0" conf="*->default" transitive="false"/>
 <dependency org="xml-apis" name="xml-apis" rev="1.4.01" /><!-- force this version as it is required by Tika -->
 <dependency org="xerces" name="xercesImpl" rev="2.12.2" />
diff --git a/src/plugin/language-identifier/ivy.xml b/src/plugin/language-identifier/ivy.xml
index f64b97055..e22284c03 100644
--- a/src/plugin/language-identifier/ivy.xml
+++ b/src/plugin/language-identifier/ivy.xml
@@ -35,7 +35,7 @@
 </publications>
 <dependencies>
- <dependency org="org.tallison.tika" name="tika-langdetect-optimaize-shaded" rev="2.9.0.0" conf="*->default" transitive="false"/>
+ <dependency org="org.tallison.tika" name="tika-langdetect-optimaize-shaded" rev="2.9.1.0" conf="*->default" transitive="false"/>
 </dependencies>
 </ivy-module>
diff --git a/src/plugin/language-identifier/plugin.xml b/src/plugin/language-identifier/plugin.xml
index dab1a52f3..94929bdbf 100644
--- a/src/plugin/language-identifier/plugin.xml
+++ b/src/plugin/language-identifier/plugin.xml
@@ -26,7 +26,7 @@
 <export name="*"/>
 </library>
 <!-- dependencies of Tika's Optimaize language detector (tika-langdetect-optimaize) -->
- <library name="tika-langdetect-optimaize-shaded-2.9.0.0.jar"/>
+ <library name="tika-langdetect-optimaize-shaded-2.9.1.0.jar"/>
 </runtime>
 <requires>
diff --git a/src/plugin/parse-tika/ivy.xml b/src/plugin/parse-tika/ivy.xml
index b89e812e1..8008e3244 100644
--- a/src/plugin/parse-tika/ivy.xml
+++ b/src/plugin/parse-tika/ivy.xml
@@ -35,7 +35,7 @@
 </publications>
 <dependencies>
- <dependency org="org.tallison.tika" name="tika-parsers-standard-package-shaded" rev="2.9.0.0" conf="*->default" transitive="false"/>
+ <dependency org="org.tallison.tika" name="tika-parsers-standard-package-shaded" rev="2.9.1.0" conf="*->default" transitive="false"/>
 </dependencies>
 </ivy-module>
diff --git a/src/plugin/parse-tika/plugin.xml b/src/plugin/parse-tika/plugin.xml
index dd4fe7fde..04afb9fac 100644
--- a/src/plugin/parse-tika/plugin.xml
+++ b/src/plugin/parse-tika/plugin.xml
@@ -25,7 +25,7 @@
 <library name="parse-tika.jar">
 <export name="*"/>
 </library>
- <library name="tika-parsers-standard-package-shaded-2.9.0.0.jar"/>
+ <library name="tika-parsers-standard-package-shaded-2.9.1.0.jar"/>
 </runtime>
 <requires>