This is an automated email from the ASF dual-hosted git repository. tilman pushed a commit to branch TIKA-4622 in repository https://gitbox.apache.org/repos/asf/tika.git
commit e1f2d5949d6d26a9567826b42602f118bf6b5811
Author: Tilman Hausherr <[email protected]>
AuthorDate: Wed Jan 14 13:44:07 2026 +0100

    TIKA-4622: Add test for PDF annotations with no content

    Added a test for PDF annotations without content streams.
---
 .../src/test/java/org/apache/tika/parser/pdf/PDFParserTest.java | 9 ++++++++-
 1 file changed, 8 insertions(+), 1 deletion(-)

diff --git a/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/test/java/org/apache/tika/parser/pdf/PDFParserTest.java b/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/test/java/org/apache/tika/parser/pdf/PDFParserTest.java
index 195da525ca..2d49e37c48 100644
--- a/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/test/java/org/apache/tika/parser/pdf/PDFParserTest.java
+++ b/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/test/java/org/apache/tika/parser/pdf/PDFParserTest.java
@@ -6,7 +6,7 @@
  * (the "License"); you may not use this file except in compliance with
  * the License. You may obtain a copy of the License at
  *
- *      http://www.apache.org/licenses/LICENSE-2.0
+ *      http://www.apache.org/licenses-2.0
  *
  * Unless required by applicable law or agreed to in writing, software
  * distributed under the License is distributed on an "AS IS" BASIS,
@@ -368,6 +368,13 @@ public class PDFParserTest extends TikaTest {
         assertContains("igalsh", r.xml);
     }
 
+    // TIKA-4622 / PDFBOX-6145 make sure that annotations aren't missed if no page content stream
+    @Test
+    public void testAnnotationNoContents() throws Exception {
+        XMLResult r = getXML("testPDFFileEmbInAnnotation_noContents.pdf");
+        assertContains("Excel.xlsx", r.xml);
+    }
+
     @Test
     public void testEmbeddedPDFs() throws Exception {
         List<Metadata> metadataList = getRecursiveMetadata("testPDFPackage.pdf");
