This is an automated email from the ASF dual-hosted git repository.
tilman pushed a commit to branch branch_2x
in repository https://gitbox.apache.org/repos/asf/tika.git
The following commit(s) were added to refs/heads/branch_2x by this push:
new 8e479908a TIKA-4311: refactor / simplify
8e479908a is described below
commit 8e479908a4f6efb18b54362160dc12119e4262fd
Author: Tilman Hausherr <[email protected]>
AuthorDate: Tue Sep 17 20:21:02 2024 +0200
TIKA-4311: refactor / simplify
---
.../java/org/apache/tika/parser/pdf/PDFMarkedContent2XHTML.java | 7 +++----
1 file changed, 3 insertions(+), 4 deletions(-)
diff --git a/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/main/java/org/apache/tika/parser/pdf/PDFMarkedContent2XHTML.java b/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/main/java/org/apache/tika/parser/pdf/PDFMarkedContent2XHTML.java
index d5495f7f2..b745fea02 100644
--- a/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/main/java/org/apache/tika/parser/pdf/PDFMarkedContent2XHTML.java
+++ b/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/main/java/org/apache/tika/parser/pdf/PDFMarkedContent2XHTML.java
@@ -178,14 +178,13 @@ public class PDFMarkedContent2XHTML extends PDF2XHTML {
COSBase kidbase = ((COSObject) kid).getObject();
if (kidbase instanceof COSDictionary) {
COSDictionary dict = (COSDictionary) kidbase;
- if (dict.containsKey(COSName.TYPE) &&
- COSName.PAGE.equals(dict.getCOSName(COSName.TYPE))) {
+ if (COSName.PAGE.equals(dict.getCOSName(COSName.TYPE))) {
pageRefs.add(new ObjectRef(((COSObject) kid).getObjectNumber(),
((COSObject) kid).getGenerationNumber()));
continue;
}
- if (((COSDictionary) kidbase).containsKey(COSName.KIDS)) {
- findPages(((COSDictionary) kidbase).getDictionaryObject(COSName.KIDS), pageRefs);
+ if (dict.containsKey(COSName.KIDS)) {
+ findPages(dict.getDictionaryObject(COSName.KIDS), pageRefs);
}
}
}