[ 
https://issues.apache.org/jira/browse/NUTCH-2667?page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel&focusedCommentId=16662235#comment-16662235
 ] 

ASF GitHub Bot commented on NUTCH-2667:
---------------------------------------

sebastian-nagel commented on a change in pull request #403: NUTCH-2667 Update 
Tika and Commons Collections 4
URL: https://github.com/apache/nutch/pull/403#discussion_r227682607
 
 

 ##########
 File path: src/plugin/parse-tika/plugin.xml
 ##########
 @@ -25,87 +25,108 @@
       <library name="parse-tika.jar">
          <export name="*"/>
       </library>
-
-       <library name="apache-mime4j-core-0.7.2.jar"/>
-       <library name="apache-mime4j-dom-0.7.2.jar"/>
-       <library name="asm-debug-all-4.1.jar"/>
-       <library name="aspectjrt-1.8.0.jar"/>
-       <library name="bcmail-jdk15on-1.52.jar"/>
-       <library name="bcpkix-jdk15on-1.52.jar"/>
-       <library name="bcprov-jdk15on-1.52.jar"/>
-       <library name="boilerpipe-1.1.0.jar"/>
-       <library name="bzip2-0.9.1.jar"/>
-       <library name="c3p0-0.9.1.1.jar"/>
-       <library name="cdm-4.5.5.jar"/>
-       <library name="commons-codec-1.6.jar"/>
-       <library name="commons-compress-1.9.jar"/>
-       <library name="commons-csv-1.0.jar"/>
-       <library name="commons-exec-1.3.jar"/>
-       <library name="commons-io-2.4.jar"/>
-       <library name="commons-lang-2.6.jar"/>
-       <library name="commons-logging-1.1.3.jar"/>
-       <library name="commons-logging-api-1.1.jar"/>
-       <library name="commons-vfs2-2.0.jar"/>
-       <library name="ehcache-core-2.6.2.jar"/>
-       <library name="fontbox-1.8.10.jar"/>
-       <library name="geoapi-3.0.0.jar"/>
-       <library name="grib-4.5.5.jar"/>
-       <library name="guava-11.0.2.jar"/>
-       <library name="httpclient-4.2.6.jar"/>
-       <library name="httpcore-4.2.5.jar"/>
-       <library name="httpmime-4.2.6.jar"/>
-       <library name="httpservices-4.5.5.jar"/>
-       <library name="isoparser-1.0.2.jar"/>
-       <library name="jackcess-2.1.2.jar"/>
-       <library name="jackcess-encrypt-2.1.0.jar"/>
-       <library name="java-libpst-0.8.1.jar"/>
-       <library name="jcip-annotations-1.0.jar"/>
-       <library name="jcommander-1.35.jar"/>
-       <library name="jdom-1.0.jar"/>
-       <library name="jdom2-2.0.4.jar"/>
-       <library name="jempbox-1.8.10.jar"/>
-       <library name="jhighlight-1.0.2.jar"/>
-       <library name="jj2000-5.2.jar"/>
-       <library name="jmatio-1.0.jar"/>
-       <library name="jna-4.1.0.jar"/>
-       <library name="joda-time-2.2.jar"/>
-       <library name="json-simple-1.1.1.jar"/>
-       <library name="jsoup-1.7.2.jar"/>
-       <library name="jsr-275-0.9.3.jar"/>
-       <library name="jsr305-1.3.9.jar"/>
-       <library name="juniversalchardet-1.0.3.jar"/>
-       <library name="junrar-0.7.jar"/>
-       <library name="jwnl-1.3.3.jar"/>
-       <library name="maven-scm-api-1.4.jar"/>
-       <library name="maven-scm-provider-svn-commons-1.4.jar"/>
-       <library name="maven-scm-provider-svnexe-1.4.jar"/>
-       <library name="metadata-extractor-2.8.0.jar"/>
-       <library name="netcdf4-4.5.5.jar"/>
-       <library name="opennlp-maxent-3.0.3.jar"/>
-       <library name="opennlp-tools-1.5.3.jar"/>
-       <library name="pdfbox-1.8.10.jar"/>
-       <library name="plexus-utils-1.5.6.jar"/>
-       <library name="poi-3.13-beta1.jar"/>
-       <library name="poi-ooxml-3.13-beta1.jar"/>
-       <library name="poi-ooxml-schemas-3.13-beta1.jar"/>
-       <library name="poi-scratchpad-3.13-beta1.jar"/>
-       <library name="protobuf-java-2.5.0.jar"/>
-       <library name="quartz-2.2.0.jar"/>
-       <library name="regexp-1.3.jar"/>
-       <library name="rome-0.9.jar"/>
-       <library name="sis-metadata-0.5.jar"/>
-       <library name="sis-netcdf-0.5.jar"/>
-       <library name="sis-referencing-0.5.jar"/>
-       <library name="sis-storage-0.5.jar"/>
-       <library name="sis-utility-0.5.jar"/>
-       <library name="tagsoup-1.2.1.jar"/>
-       <library name="tika-parsers-1.10.jar"/>
-       <library name="udunits-4.5.5.jar"/>
-       <library name="vorbis-java-core-0.6.jar"/>
-       <library name="vorbis-java-tika-0.6.jar"/>
-       <library name="xmlbeans-2.6.0.jar"/>
-       <library name="xmpcore-5.1.2.jar"/>
-       <library name="xz-1.5.jar"/>
+      <!-- dependencies of Tika (tika-parsers) -->
+      <library name="FastInfoset-1.2.13.jar"/>
+      <library name="activation-1.1.1.jar"/>
+      <library name="apache-mime4j-core-0.8.2.jar"/>
+      <library name="apache-mime4j-dom-0.8.2.jar"/>
+      <library name="asm-6.2.jar"/>
+      <library name="bcmail-jdk15on-1.60.jar"/>
+      <library name="bcpkix-jdk15on-1.60.jar"/>
+      <library name="bcprov-jdk15on-1.60.jar"/>
+      <library name="boilerpipe-1.1.0.jar"/>
+      <library name="bzip2-0.9.1.jar"/>
+      <library name="c3p0-0.9.1.1.jar"/>
+      <library name="cdm-4.5.5.jar"/>
+      <library name="commons-codec-1.10.jar"/>
 
 Review comment:
   @lewismc, was this caused by an existing, non-empty 
src/plugin/parse-tika/lib/ folder? Either way, we should add `rm lib/*` as a 
required step in howto_upgrade_tika.txt.

----------------------------------------------------------------
This is an automated message from the Apache Git Service.
To respond to the message, please log on GitHub and use the
URL above to go to the specific comment.
 
For queries about this service, please contact Infrastructure at:
us...@infra.apache.org


> Update Tika and Commons Collections 4
> -------------------------------------
>
>                 Key: NUTCH-2667
>                 URL: https://issues.apache.org/jira/browse/NUTCH-2667
>             Project: Nutch
>          Issue Type: Improvement
>          Components: build
>    Affects Versions: 2.4
>            Reporter: Lewis John McGibbney
>            Assignee: Lewis John McGibbney
>            Priority: Blocker
>             Fix For: 2.4
>
>
> Tika and Commons Collections 4 need to be updated. This issue needs to 
> address them.



--
This message was sent by Atlassian JIRA
(v7.6.3#76005)

Reply via email to