This is an automated email from the ASF dual-hosted git repository. tallison pushed a commit to branch TIKA-4567 in repository https://gitbox.apache.org/repos/asf/tika.git
commit c18316141cbf680a1de72b407fac0a59b8822e8e
Author: tallison <[email protected]>
AuthorDate: Thu Dec 11 11:34:47 2025 -0500

    TIKA-4567 -- further tweaks
---
 .../src/main/java/org/apache/tika/parser/pdf/OcrConfig.java   | 10 +++++++---
 .../main/java/org/apache/tika/parser/pdf/PDFParserConfig.java |  8 +++++---
 2 files changed, 12 insertions(+), 6 deletions(-)

diff --git a/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/main/java/org/apache/tika/parser/pdf/OcrConfig.java b/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/main/java/org/apache/tika/parser/pdf/OcrConfig.java
index 97bd59e5a6..6884339da4 100644
--- a/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/main/java/org/apache/tika/parser/pdf/OcrConfig.java
+++ b/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/main/java/org/apache/tika/parser/pdf/OcrConfig.java
@@ -179,11 +179,15 @@ public class OcrConfig implements Serializable {
     }
 
     /**
-     * No-op setter for Jackson deserialization compatibility.
-     * The format name is derived from {@link #setImageFormat(ImageFormat)}.
+     * Sets the image format by name (e.g., "png", "tiff", "jpeg").
+     * This is a convenience setter for JSON configuration.
+     *
+     * @param imageFormatName the format name (case-insensitive)
      */
     public void setImageFormatName(String imageFormatName) {
-        // Ignored - use setImageFormat instead
+        if (imageFormatName != null) {
+            this.imageFormat = ImageFormat.valueOf(imageFormatName.toUpperCase(Locale.ROOT));
+        }
     }
 
     public float getImageQuality() {
diff --git a/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/main/java/org/apache/tika/parser/pdf/PDFParserConfig.java b/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/main/java/org/apache/tika/parser/pdf/PDFParserConfig.java
index 584b59c513..2ff3607cd8 100644
--- a/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/main/java/org/apache/tika/parser/pdf/PDFParserConfig.java
+++ b/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/main/java/org/apache/tika/parser/pdf/PDFParserConfig.java
@@ -568,11 +568,13 @@ public class PDFParserConfig implements Serializable {
     }
 
     /**
-     * No-op setter for Jackson deserialization compatibility.
-     * Use {@link #setOcrImageFormat(OcrConfig.ImageFormat)} instead.
+     * Sets the OCR image format by name (e.g., "png", "tiff", "jpeg").
+     * This is a convenience setter for JSON configuration.
+     *
+     * @param ocrImageFormatName the format name (case-insensitive)
      */
     public void setOcrImageFormatName(String ocrImageFormatName) {
-        // Ignored - use setOcrImageFormat instead
+        ocr.setImageFormatName(ocrImageFormatName);
     }
 
     public OcrConfig.ImageFormat getOcrImageFormat() {
