This is an automated email from the ASF dual-hosted git repository. tallison pushed a commit to branch TIKA-4490 in repository https://gitbox.apache.org/repos/asf/tika.git
commit 14c3d2caf75248009bb446159ec729f8601e14bd Author: tallison <[email protected]> AuthorDate: Thu Sep 25 15:53:47 2025 -0400 Small fixes found during ossfuzz integration --- .../org/apache/tika/detect/microsoft/ooxml/OPCPackageDetector.java | 4 ++++ .../main/java/org/apache/tika/parser/microsoft/ExcelExtractor.java | 3 +++ 2 files changed, 7 insertions(+) diff --git a/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-microsoft-module/src/main/java/org/apache/tika/detect/microsoft/ooxml/OPCPackageDetector.java b/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-microsoft-module/src/main/java/org/apache/tika/detect/microsoft/ooxml/OPCPackageDetector.java index 341e9755b..28db84e09 100644 --- a/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-microsoft-module/src/main/java/org/apache/tika/detect/microsoft/ooxml/OPCPackageDetector.java +++ b/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-microsoft-module/src/main/java/org/apache/tika/detect/microsoft/ooxml/OPCPackageDetector.java @@ -198,6 +198,10 @@ public class OPCPackageDetector implements ZipContainerDetector { // Get the type of the core document part PackagePart corePart = pkg.getPart(core.getRelationship(0)); + if (corePart == null) { + return null; + } + String coreType = corePart.getContentType(); if (coreType.contains(".xps")) { diff --git a/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-microsoft-module/src/main/java/org/apache/tika/parser/microsoft/ExcelExtractor.java b/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-microsoft-module/src/main/java/org/apache/tika/parser/microsoft/ExcelExtractor.java index 41a1a840e..1604b5aab 100644 --- a/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-microsoft-module/src/main/java/org/apache/tika/parser/microsoft/ExcelExtractor.java +++ b/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-microsoft-module/src/main/java/org/apache/tika/parser/microsoft/ExcelExtractor.java @@ -508,6 +508,9 @@ public class ExcelExtractor extends AbstractPOIFSExtractor { break; case LabelSSTRecord.sid: // Ref. a string in the shared string table + if (sstRecord == null) { + throw new TikaException("sstRecord should have been initialized before a ref to the shared string table"); + } LabelSSTRecord sst = (LabelSSTRecord) record; UnicodeString unicode = sstRecord.getString(sst.getSSTIndex()); String cellString = null;
