This is an automated email from the ASF dual-hosted git repository.
tallison pushed a change to branch main
in repository https://gitbox.apache.org/repos/asf/tika.git.
from 23329a6 TIKA-3129 -- add a status endpoint to report server status.
Users must turn it on via the commandline -status option.
add 3bdcd97 TIKA-3137 -- first pass, need to add unit tests for tika-batch
add 78e5b9a TIKA-3140 -- initial commit
add eb6e07e TIKA-3137 add a list type for Param/configuration to avoid
the comma-delimited lists which will get huge and ugly and were a bad idea.
add 4971e2e TIKA-3137 add a list type for Param/configuration to avoid
the comma-delimited lists which will get huge and ugly and were a bad idea.
new bf224dc Merge remote-tracking branch 'origin/TIKA-3140' into main
The 1 revision listed above as "new" is entirely new to this
repository and will be described in a separate email. The revisions
listed as "add" were already present in the repository and have only
been added to this reference.
Summary of changes:
.../src/main/java/org/apache/tika/cli/TikaCLI.java | 4 +-
.../batch/fs/RecursiveParserWrapperFSConsumer.java | 9 +-
.../tika/batch/fs/StreamOutRPWFSConsumer.java | 20 ++-
.../fs/builders/BasicTikaFSConsumersBuilder.java | 11 +-
.../RecursiveParserWrapperFSConsumerTest.java | 5 +-
.../main/java/org/apache/tika/config/Param.java | 70 +++++++--
.../java/org/apache/tika/config/TikaConfig.java | 115 +++++++++++++-
.../metadata/filter/ClearByMimeMetadataFilter.java | 72 +++++++++
.../metadata/filter/CompositeMetadataFilter.java | 23 +--
.../filter/DefaultMetadataFilter.java} | 38 +++--
.../filter/ExcludeFieldMetadataFilter.java | 41 +++--
.../filter/IncludeFieldMetadataFilter.java} | 54 +++----
.../tika/metadata/filter/MetadataFilter.java | 15 +-
.../apache/tika/metadata/filter/NoOpFilter.java | 21 ++-
.../tika/sax/RecursiveParserWrapperHandler.java | 31 +++-
.../org.apache.tika.metadata.filter.MetadataFilter | 2 +-
.../java/org/apache/tika/config/ParamTest.java | 7 +
.../org/apache/tika/config/TikaConfigTest.java | 2 +
.../tika/metadata/filter/MockUpperCaseFilter.java | 27 ++--
.../tika/metadata/filter/TestMetadataFilter.java | 170 +++++++++++++++++++++
.../tika/parser/ParameterizedParserTest.java | 3 +-
...3-vowel-parser-ae.xml => TIKA-3137-exclude.xml} | 13 +-
...owel-parser-ae.xml => TIKA-3137-include-uc.xml} | 14 +-
...3-vowel-parser-ae.xml => TIKA-3137-include.xml} | 13 +-
...-vowel-parser-ae.xml => TIKA-3137-mimes-uc.xml} | 14 +-
.../tika/eval/metadata/TikaEvalMetadataFilter.java | 104 +++++++++++++
.../eval/metadata/TikaEvalMetadataFilterTest.java | 51 +++++++
.../tika/parser/RecursiveParserWrapperTest.java | 43 ++++++
.../org/apache/tika/parser/TIKA-3137-include.xml | 22 ++-
.../server/resource/RecursiveMetadataResource.java | 3 +-
.../java/org/apache/tika/server/CXFTestBase.java | 7 +-
.../tika/server/RecursiveMetadataFilterTest.java | 108 +++++++++++++
.../org/apache/tika/server/TIKA-3137-include.xml | 22 ++-
33 files changed, 981 insertions(+), 173 deletions(-)
create mode 100644
tika-core/src/main/java/org/apache/tika/metadata/filter/ClearByMimeMetadataFilter.java
copy tika-server/src/main/java/org/apache/tika/server/MetadataList.java =>
tika-core/src/main/java/org/apache/tika/metadata/filter/CompositeMetadataFilter.java
(65%)
copy tika-core/src/main/java/org/apache/tika/{mime/OrClause.java =>
metadata/filter/DefaultMetadataFilter.java} (51%)
copy tika-fuzzing/src/main/java/org/apache/tika/fuzzing/Transformer.java =>
tika-core/src/main/java/org/apache/tika/metadata/filter/ExcludeFieldMetadataFilter.java
(53%)
copy
tika-core/src/main/java/org/apache/tika/{detect/NonDetectingEncodingDetector.java
=> metadata/filter/IncludeFieldMetadataFilter.java} (51%)
copy
tika-parsers/src/main/java/org/apache/tika/parser/utils/DataURISchemeParseException.java
=> tika-core/src/main/java/org/apache/tika/metadata/filter/MetadataFilter.java
(74%)
copy tika-server/src/main/java/org/apache/tika/server/MetadataList.java =>
tika-core/src/main/java/org/apache/tika/metadata/filter/NoOpFilter.java (69%)
copy
tika-parsers/src/main/resources/org/apache/tika/parser/ner/nltk/NLTKServer.properties
=>
tika-core/src/main/resources/META-INF/services/org.apache.tika.metadata.filter.MetadataFilter
(94%)
copy
tika-server/src/main/java/org/apache/tika/server/DefaultInputStreamFactory.java
=>
tika-core/src/test/java/org/apache/tika/metadata/filter/MockUpperCaseFilter.java
(61%)
create mode 100644
tika-core/src/test/java/org/apache/tika/metadata/filter/TestMetadataFilter.java
copy
tika-core/src/test/resources/org/apache/tika/config/{TIKA-2653-vowel-parser-ae.xml
=> TIKA-3137-exclude.xml} (76%)
copy
tika-core/src/test/resources/org/apache/tika/config/{TIKA-2653-vowel-parser-ae.xml
=> TIKA-3137-include-uc.xml} (70%)
copy
tika-core/src/test/resources/org/apache/tika/config/{TIKA-2653-vowel-parser-ae.xml
=> TIKA-3137-include.xml} (76%)
copy
tika-core/src/test/resources/org/apache/tika/config/{TIKA-2653-vowel-parser-ae.xml
=> TIKA-3137-mimes-uc.xml} (70%)
create mode 100644
tika-eval/src/main/java/org/apache/tika/eval/metadata/TikaEvalMetadataFilter.java
create mode 100644
tika-eval/src/test/java/org/apache/tika/eval/metadata/TikaEvalMetadataFilterTest.java
copy
tika-core/src/test/resources/org/apache/tika/config/TIKA-2653-vowel-parser-ae.xml
=>
tika-parsers/src/test/resources/org/apache/tika/parser/TIKA-3137-include.xml
(58%)
create mode 100644
tika-server/src/test/java/org/apache/tika/server/RecursiveMetadataFilterTest.java
copy
tika-core/src/test/resources/org/apache/tika/config/TIKA-2653-vowel-parser-ae.xml
=> tika-server/src/test/resources/org/apache/tika/server/TIKA-3137-include.xml
(58%)