[ 
https://issues.apache.org/jira/browse/NUTCH-2667?page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel&focusedCommentId=16662236#comment-16662236
 ] 

ASF GitHub Bot commented on NUTCH-2667:
---------------------------------------

sebastian-nagel commented on a change in pull request #403: NUTCH-2667 Update 
Tika and Commons Collections 4
URL: https://github.com/apache/nutch/pull/403#discussion_r227680767
 
 

 ##########
 File path: src/plugin/parse-tika/plugin.xml
 ##########
 @@ -25,87 +25,108 @@
       <library name="parse-tika.jar">
          <export name="*"/>
       </library>
-
-       <library name="apache-mime4j-core-0.7.2.jar"/>
-       <library name="apache-mime4j-dom-0.7.2.jar"/>
-       <library name="asm-debug-all-4.1.jar"/>
-       <library name="aspectjrt-1.8.0.jar"/>
-       <library name="bcmail-jdk15on-1.52.jar"/>
-       <library name="bcpkix-jdk15on-1.52.jar"/>
-       <library name="bcprov-jdk15on-1.52.jar"/>
-       <library name="boilerpipe-1.1.0.jar"/>
-       <library name="bzip2-0.9.1.jar"/>
-       <library name="c3p0-0.9.1.1.jar"/>
-       <library name="cdm-4.5.5.jar"/>
-       <library name="commons-codec-1.6.jar"/>
-       <library name="commons-compress-1.9.jar"/>
-       <library name="commons-csv-1.0.jar"/>
-       <library name="commons-exec-1.3.jar"/>
-       <library name="commons-io-2.4.jar"/>
-       <library name="commons-lang-2.6.jar"/>
-       <library name="commons-logging-1.1.3.jar"/>
-       <library name="commons-logging-api-1.1.jar"/>
-       <library name="commons-vfs2-2.0.jar"/>
-       <library name="ehcache-core-2.6.2.jar"/>
-       <library name="fontbox-1.8.10.jar"/>
-       <library name="geoapi-3.0.0.jar"/>
-       <library name="grib-4.5.5.jar"/>
-       <library name="guava-11.0.2.jar"/>
-       <library name="httpclient-4.2.6.jar"/>
-       <library name="httpcore-4.2.5.jar"/>
-       <library name="httpmime-4.2.6.jar"/>
-       <library name="httpservices-4.5.5.jar"/>
-       <library name="isoparser-1.0.2.jar"/>
-       <library name="jackcess-2.1.2.jar"/>
-       <library name="jackcess-encrypt-2.1.0.jar"/>
-       <library name="java-libpst-0.8.1.jar"/>
-       <library name="jcip-annotations-1.0.jar"/>
-       <library name="jcommander-1.35.jar"/>
-       <library name="jdom-1.0.jar"/>
-       <library name="jdom2-2.0.4.jar"/>
-       <library name="jempbox-1.8.10.jar"/>
-       <library name="jhighlight-1.0.2.jar"/>
-       <library name="jj2000-5.2.jar"/>
-       <library name="jmatio-1.0.jar"/>
-       <library name="jna-4.1.0.jar"/>
-       <library name="joda-time-2.2.jar"/>
-       <library name="json-simple-1.1.1.jar"/>
-       <library name="jsoup-1.7.2.jar"/>
-       <library name="jsr-275-0.9.3.jar"/>
-       <library name="jsr305-1.3.9.jar"/>
-       <library name="juniversalchardet-1.0.3.jar"/>
-       <library name="junrar-0.7.jar"/>
-       <library name="jwnl-1.3.3.jar"/>
-       <library name="maven-scm-api-1.4.jar"/>
-       <library name="maven-scm-provider-svn-commons-1.4.jar"/>
-       <library name="maven-scm-provider-svnexe-1.4.jar"/>
-       <library name="metadata-extractor-2.8.0.jar"/>
-       <library name="netcdf4-4.5.5.jar"/>
-       <library name="opennlp-maxent-3.0.3.jar"/>
-       <library name="opennlp-tools-1.5.3.jar"/>
-       <library name="pdfbox-1.8.10.jar"/>
-       <library name="plexus-utils-1.5.6.jar"/>
-       <library name="poi-3.13-beta1.jar"/>
-       <library name="poi-ooxml-3.13-beta1.jar"/>
-       <library name="poi-ooxml-schemas-3.13-beta1.jar"/>
-       <library name="poi-scratchpad-3.13-beta1.jar"/>
-       <library name="protobuf-java-2.5.0.jar"/>
-       <library name="quartz-2.2.0.jar"/>
-       <library name="regexp-1.3.jar"/>
-       <library name="rome-0.9.jar"/>
-       <library name="sis-metadata-0.5.jar"/>
-       <library name="sis-netcdf-0.5.jar"/>
-       <library name="sis-referencing-0.5.jar"/>
-       <library name="sis-storage-0.5.jar"/>
-       <library name="sis-utility-0.5.jar"/>
-       <library name="tagsoup-1.2.1.jar"/>
-       <library name="tika-parsers-1.10.jar"/>
-       <library name="udunits-4.5.5.jar"/>
-       <library name="vorbis-java-core-0.6.jar"/>
-       <library name="vorbis-java-tika-0.6.jar"/>
-       <library name="xmlbeans-2.6.0.jar"/>
-       <library name="xmpcore-5.1.2.jar"/>
-       <library name="xz-1.5.jar"/>
+      <!-- dependencies of Tika (tika-parsers) -->
+      <library name="FastInfoset-1.2.13.jar"/>
+      <library name="activation-1.1.1.jar"/>
+      <library name="apache-mime4j-core-0.8.2.jar"/>
+      <library name="apache-mime4j-dom-0.8.2.jar"/>
+      <library name="asm-6.2.jar"/>
+      <library name="bcmail-jdk15on-1.60.jar"/>
+      <library name="bcpkix-jdk15on-1.60.jar"/>
+      <library name="bcprov-jdk15on-1.60.jar"/>
+      <library name="boilerpipe-1.1.0.jar"/>
+      <library name="bzip2-0.9.1.jar"/>
+      <library name="c3p0-0.9.1.1.jar"/>
+      <library name="cdm-4.5.5.jar"/>
+      <library name="commons-codec-1.10.jar"/>
 
 Review comment:
   Why are there multiple commons-codec libraries (1.6 and 1.10)? Tika 
1.19.1 depends on 1.11, but the "downgrade" to 1.10 could be caused by the 
exclusions in src/plugin/parse-tika/ivy.xml.

----------------------------------------------------------------
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.
 
For queries about this service, please contact Infrastructure at:
[email protected]


> Update Tika and Commons Collections 4
> -------------------------------------
>
>                 Key: NUTCH-2667
>                 URL: https://issues.apache.org/jira/browse/NUTCH-2667
>             Project: Nutch
>          Issue Type: Improvement
>          Components: build
>    Affects Versions: 2.4
>            Reporter: Lewis John McGibbney
>            Assignee: Lewis John McGibbney
>            Priority: Blocker
>             Fix For: 2.4
>
>
> Tika and Commons Collections 4 need to be updated. This issue needs to 
> address them.



--
This message was sent by Atlassian JIRA
(v7.6.3#76005)

Reply via email to