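I just tried the latest Nutch 2.x after being away for a while, and Tika parsing
doesn't seem to be working. Both the fetcher job and the parser job fail with the
same NoSuchMethodError while the Tika parser plugin is being configured: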
Exception in thread "main" java.lang.NoSuchMethodError: org.apache.tika.mime.MediaType.set([Lorg/apache/tika/mime/MediaType;)Ljava/util/Set;
at org.apache.tika.parser.crypto.Pkcs7Parser.getSupportedTypes(Pkcs7Parser.java:52)
at org.apache.nutch.parse.tika.TikaConfig.<init>(TikaConfig.java:149)
at org.apache.nutch.parse.tika.TikaConfig.getDefaultConfig(TikaConfig.java:210)
at org.apache.nutch.parse.tika.TikaParser.setConf(TikaParser.java:203)
at org.apache.nutch.plugin.Extension.getExtensionInstance(Extension.java:162)
at org.apache.nutch.parse.ParserFactory.getFields(ParserFactory.java:209)
at org.apache.nutch.parse.ParserJob.getFields(ParserJob.java:193)
at org.apache.nutch.fetcher.FetcherJob.getFields(FetcherJob.java:142)
at org.apache.nutch.fetcher.FetcherJob.run(FetcherJob.java:184)
at org.apache.nutch.fetcher.FetcherJob.fetch(FetcherJob.java:219)
at org.apache.nutch.fetcher.FetcherJob.run(FetcherJob.java:301)
at org.apache.hadoop.util.ToolRunner.run(ToolRunner.java:65)
at org.apache.nutch.fetcher.FetcherJob.main(FetcherJob.java:307)
Exception in thread "main" java.lang.NoSuchMethodError: org.apache.tika.mime.MediaType.set([Lorg/apache/tika/mime/MediaType;)Ljava/util/Set;
at org.apache.tika.parser.crypto.Pkcs7Parser.getSupportedTypes(Pkcs7Parser.java:52)
at org.apache.nutch.parse.tika.TikaConfig.<init>(TikaConfig.java:149)
at org.apache.nutch.parse.tika.TikaConfig.getDefaultConfig(TikaConfig.java:210)
at org.apache.nutch.parse.tika.TikaParser.setConf(TikaParser.java:203)
at org.apache.nutch.plugin.Extension.getExtensionInstance(Extension.java:162)
at org.apache.nutch.parse.ParserFactory.getFields(ParserFactory.java:209)
at org.apache.nutch.parse.ParserJob.getFields(ParserJob.java:193)
at org.apache.nutch.parse.ParserJob.run(ParserJob.java:245)
at org.apache.nutch.parse.ParserJob.parse(ParserJob.java:259)
at org.apache.nutch.parse.ParserJob.run(ParserJob.java:302)
at org.apache.hadoop.util.ToolRunner.run(ToolRunner.java:65)
at org.apache.nutch.parse.ParserJob.main(ParserJob.java:306)