This is an automated email from the ASF dual-hosted git repository. tallison pushed a commit to branch TIKA-4630-on-main in repository https://gitbox.apache.org/repos/asf/tika.git
commit 0d98d5ddd70d265198db7f9ce9ee322842eb2612 Merge: 6709c4a660 1c078b499b Author: tallison <[email protected]> AuthorDate: Fri Jan 23 15:27:34 2026 -0500 Merge remote-tracking branch 'origin/main' into TIKA-4630-on-main docs/antora-playbook.yml | 66 +++++ docs/antora.yml | 24 ++ docs/assets/logos/asf-tika-logos.zip | Bin 0 -> 446228 bytes .../ROOT/examples/migration-full-example.json | 1 + docs/modules/ROOT/examples/pdf-parser-basic.json | 1 + docs/modules/ROOT/examples/pdf-parser-full.json | 1 + docs/modules/ROOT/examples/tesseract-basic.json | 1 + docs/modules/ROOT/examples/tesseract-full.json | 1 + docs/modules/ROOT/nav.adoc | 40 +++ docs/modules/ROOT/pages/advanced/index.adoc | 31 +++ docs/modules/ROOT/pages/advanced/robustness.adoc | 137 +++++++++++ docs/modules/ROOT/pages/advanced/spooling.adoc | 229 +++++++++++++++++ docs/modules/ROOT/pages/configuration/index.adoc | 40 +++ .../pages/configuration/parsers/pdf-parser.adoc | 43 ++++ .../parsers/tesseract-ocr-parser.adoc | 67 +++++ docs/modules/ROOT/pages/faq.adoc | 28 +++ docs/modules/ROOT/pages/index.adoc | 43 ++++ docs/modules/ROOT/pages/maintainers/index.adoc | 32 +++ .../pages/maintainers/release-guides/docker.adoc | 133 ++++++++++ .../pages/maintainers/release-guides/grpc.adoc | 32 +++ .../pages/maintainers/release-guides/helm.adoc | 138 +++++++++++ .../pages/maintainers/release-guides/index.adoc | 32 +++ .../pages/maintainers/release-guides/tika.adoc | 271 +++++++++++++++++++++ docs/modules/ROOT/pages/maintainers/site.adoc | 172 +++++++++++++ .../pages/migration-to-4x/design-notes-4x.adoc | 127 ++++++++++ docs/modules/ROOT/pages/migration-to-4x/index.adoc | 33 +++ .../pages/migration-to-4x/metadata-changes-4x.adoc | 121 +++++++++ .../migration-to-4x}/migrating-tika-server-4x.adoc | 2 +- .../pages/migration-to-4x/migrating-to-4x.adoc | 157 ++++++++++++ .../pages/migration-to-4x/serialization-4x.adoc | 101 ++++++++ docs/modules/ROOT/pages/pipes/index.adoc | 37 +++ docs/modules/ROOT/pages/roadmap.adoc | 96 ++++++++ docs/modules/ROOT/pages/security.adoc | 34 +++ docs/modules/ROOT/pages/using-tika/cli/index.adoc | 134 ++++++++++ docs/modules/ROOT/pages/using-tika/grpc/index.adoc | 32 +++ docs/modules/ROOT/pages/using-tika/index.adoc | 71 ++++++ .../pages/using-tika/java-api/getting-started.adoc | 130 ++++++++++ .../ROOT/pages/using-tika/java-api/index.adoc | 179 ++++++++++++++ .../ROOT/pages/using-tika/server/index.adoc | 42 ++++ docs/pom.xml | 30 +++ docs/supplemental-ui/css/search.css | 82 +++++++ docs/supplemental-ui/img/ASF_Tika-colour.png | Bin 0 -> 30720 bytes docs/supplemental-ui/img/ASF_Tika-colour.svg | 109 +++++++++ docs/supplemental-ui/js/search.js | 119 +++++++++ docs/supplemental-ui/partials/footer-content.hbs | 3 + docs/supplemental-ui/partials/footer-scripts.hbs | 1 + docs/supplemental-ui/partials/head-scripts.hbs | 1 + docs/supplemental-ui/partials/header-content.hbs | 29 +++ .../ParsingEmbeddedDocumentExtractor.java | 14 ++ .../java/org/apache/tika/parser/ParseRecord.java | 120 +++++++++ .../apache/tika/parser/RecursiveParserWrapper.java | 12 + .../sax/AbstractRecursiveParserWrapperHandler.java | 2 + .../tika/pipes/api/emitter/AbstractEmitter.java | 7 +- .../pipes/api/emitter/AbstractStreamEmitter.java | 7 +- .../apache/tika/pipes/api/emitter/EmitData.java | 6 +- tika-pipes/tika-pipes-core/pom.xml | 4 + .../org/apache/tika/pipes/core/PipesClient.java | 46 ++-- .../tika/pipes/core/emitter/EmitDataImpl.java | 32 +-- .../core/serialization/EmitDataDeserializer.java | 75 ++++++ .../core/serialization/EmitDataSerializer.java | 45 ++++ .../pipes/core/serialization/JsonPipesIpc.java | 88 +++++++ .../serialization/PipesResultDeserializer.java | 65 +++++ .../core/serialization/PipesResultSerializer.java | 46 ++++ .../tika/pipes/core/server/ParseHandler.java | 32 ++- .../apache/tika/pipes/core/server/PipesServer.java | 49 ++-- .../apache/tika/pipes/core/MockPassbackFilter.java | 52 ++++ .../apache/tika/pipes/core/PassbackFilterTest.java | 24 +- .../apache/tika/pipes/core/PipesClientTest.java | 24 +- .../tika/pipes/emitter/jdbc/JDBCEmitter.java | 6 +- tika-serialization/pom.xml | 5 + .../apache/tika/config/loader/FrameworkConfig.java | 11 +- .../config/loader/TikaObjectMapperFactory.java | 18 +- .../org/apache/tika/serialization/TikaModule.java | 8 +- .../serdes/ParseContextDeserializer.java | 15 +- .../serdes/ParseContextSerializer.java | 7 +- .../apache/tika/serialization/SmileFormatTest.java | 110 +++++++++ 76 files changed, 4032 insertions(+), 131 deletions(-)
