Repository: tika Updated Branches: refs/heads/master 1cfd250f8 -> 7b4f6fa6c
TIKA-2096 -- fix example of not including embedded docs Project: http://git-wip-us.apache.org/repos/asf/tika/repo Commit: http://git-wip-us.apache.org/repos/asf/tika/commit/7b4f6fa6 Tree: http://git-wip-us.apache.org/repos/asf/tika/tree/7b4f6fa6 Diff: http://git-wip-us.apache.org/repos/asf/tika/diff/7b4f6fa6 Branch: refs/heads/master Commit: 7b4f6fa6c76430dbc0eeb4e6654b59e3afc38185 Parents: 1cfd250 Author: tballison <[email protected]> Authored: Mon Nov 28 11:55:48 2016 -0500 Committer: tballison <[email protected]> Committed: Mon Nov 28 11:55:48 2016 -0500 ---------------------------------------------------------------------- .../main/java/org/apache/tika/example/ParsingExample.java | 9 ++++++--- 1 file changed, 6 insertions(+), 3 deletions(-) ---------------------------------------------------------------------- http://git-wip-us.apache.org/repos/asf/tika/blob/7b4f6fa6/tika-example/src/main/java/org/apache/tika/example/ParsingExample.java ---------------------------------------------------------------------- diff --git a/tika-example/src/main/java/org/apache/tika/example/ParsingExample.java b/tika-example/src/main/java/org/apache/tika/example/ParsingExample.java index 5b8a9f3..5e3201f 100644 --- a/tika-example/src/main/java/org/apache/tika/example/ParsingExample.java +++ b/tika-example/src/main/java/org/apache/tika/example/ParsingExample.java @@ -32,6 +32,7 @@ import org.apache.tika.io.TikaInputStream; import org.apache.tika.metadata.Metadata; import org.apache.tika.metadata.serialization.JsonMetadataList; import org.apache.tika.parser.AutoDetectParser; +import org.apache.tika.parser.EmptyParser; import org.apache.tika.parser.ParseContext; import org.apache.tika.parser.Parser; import org.apache.tika.parser.RecursiveParserWrapper; @@ -95,8 +96,8 @@ public class ParsingExample { /** * If you don't want content from embedded documents, send in - * a {@link org.apache.tika.parser.ParseContext} that does not contain a - * {@link Parser}. 
+ * a {@link org.apache.tika.parser.ParseContext} that contains an + * {@link EmptyParser}. * * @return The content of a file. */ @@ -104,8 +105,10 @@ public class ParsingExample { AutoDetectParser parser = new AutoDetectParser(); BodyContentHandler handler = new BodyContentHandler(); Metadata metadata = new Metadata(); + ParseContext parseContext = new ParseContext(); + parseContext.set(Parser.class, new EmptyParser()); try (InputStream stream = ParsingExample.class.getResourceAsStream("test_recursive_embedded.docx")) { - parser.parse(stream, handler, metadata, new ParseContext()); + parser.parse(stream, handler, metadata, parseContext); return handler.toString(); } }
