[ 
https://issues.apache.org/jira/browse/TIKA-3288?page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel&focusedCommentId=17278295#comment-17278295
 ] 

Hudson commented on TIKA-3288:
------------------------------

SUCCESS: Integrated in Jenkins build Tika » tika-main-jdk8 #147 (See 
[https://ci-builds.apache.org/job/Tika/job/tika-main-jdk8/147/])
TIKA-3288 (#401) (github: 
[https://github.com/apache/tika/commit/c7e184f83fceacd9059124bcb69fb356dd0190f7])
* (edit) 
tika-pipes/tika-pipes-integration-tests/src/test/java/org/apache/tika/pipes/PipeIntegrationTests.java
* (edit) 
tika-server/tika-server-core/src/main/java/org/apache/tika/server/core/TikaServerProcess.java
* (edit) 
tika-server/tika-server-classic/src/test/java/org/apache/tika/server/classic/TikaDetectorsTest.java
* (edit) 
tika-server/tika-server-core/src/main/java/org/apache/tika/server/core/resource/TikaResource.java
* (edit) 
tika-server/tika-server-core/src/test/java/org/apache/tika/server/core/TikaMimeTypesTest.java
* (edit) 
tika-server/tika-server-core/src/test/java/org/apache/tika/server/core/TikaServerStatusTest.java
* (edit) 
tika-pipes/tika-httpclient-commons/src/main/java/org/apache/tika/client/HttpClientUtil.java
* (delete) 
tika-serialization/src/main/java/org/apache/tika/metadata/serialization/JsonMetadataBase.java
* (edit) 
tika-serialization/src/main/java/org/apache/tika/metadata/serialization/JsonStreamingSerializer.java
* (add) 
tika-serialization/src/main/java/org/apache/tika/metadata/serialization/JsonEmitData.java
* (add) 
tika-serialization/src/test/java/org/apache/tika/metadata/serialization/JsonFetchEmitTupleListTest.java
* (edit) 
tika-server/tika-server-core/src/main/java/org/apache/tika/server/core/TikaServerCli.java
* (edit) 
tika-pipes/tika-emitters/tika-emitter-solr/src/main/java/org/apache/tika/pipes/emitter/solr/SolrEmitter.java
* (edit) 
tika-server/tika-server-core/src/main/java/org/apache/tika/server/core/writer/JSONObjWriter.java
* (edit) 
tika-serialization/src/main/java/org/apache/tika/metadata/serialization/JsonMetadata.java
* (edit) tika-core/src/main/java/org/apache/tika/pipes/emitter/EmitKey.java
* (add) 
tika-server/tika-server-core/src/main/java/org/apache/tika/server/core/resource/AsyncResource.java
* (edit) 
tika-server/tika-server-core/src/main/java/org/apache/tika/server/core/writer/JSONMessageBodyWriter.java
* (edit) 
tika-server/tika-server-core/src/main/java/org/apache/tika/server/core/writer/MetadataListMessageBodyWriter.java
* (edit) 
tika-pipes/tika-emitters/tika-emitter-fs/src/main/java/org/apache/tika/pipes/emitter/fs/FileSystemEmitter.java
* (edit) tika-serialization/pom.xml
* (delete) 
tika-serialization/src/main/java/org/apache/tika/metadata/serialization/JsonMetadataDeserializer.java
* (add) 
tika-server/tika-server-core/src/main/java/org/apache/tika/server/core/resource/AsyncEmitter.java
* (edit) 
tika-core/src/main/java/org/apache/tika/pipes/fetchiterator/FetchEmitTuple.java
* (edit) 
tika-serialization/src/test/java/org/apache/tika/metadata/serialization/JsonMetadataTest.java
* (add) tika-core/src/main/java/org/apache/tika/pipes/emitter/EmitData.java
* (add) 
tika-server/tika-server-core/src/test/java/org/apache/tika/server/core/TikaServerAsyncIntegrationTest.java
* (edit) 
tika-server/tika-server-client/src/main/java/org/apache/tika/server/client/TikaHttpClient.java
* (edit) 
tika-server/tika-server-core/src/test/java/org/apache/tika/server/core/TikaServerIntegrationTest.java
* (edit) tika-app/src/main/java/org/apache/tika/cli/TikaCLI.java
* (edit) tika-core/src/main/java/org/apache/tika/pipes/emitter/Emitter.java
* (edit) 
tika-pipes/tika-emitters/tika-emitter-solr/src/test/java/org/apache/tika/pipes/emitter/solr/TestBasic.java
* (add) 
tika-server/tika-server-core/src/main/java/org/apache/tika/server/core/resource/AsyncParser.java
* (edit) 
tika-server/tika-server-core/src/test/java/org/apache/tika/server/core/TikaServerEmitterIntegrationTest.java
* (edit) 
tika-server/tika-server-core/src/main/java/org/apache/tika/server/core/resource/MetadataResource.java
* (add) 
tika-serialization/src/test/java/org/apache/tika/metadata/serialization/JsonFetchEmitTupleTest.java
* (edit) 
tika-server/tika-server-core/src/main/java/org/apache/tika/server/core/ServerStatus.java
* (edit) 
tika-server/tika-server-core/src/main/java/org/apache/tika/server/core/resource/TikaMimeTypes.java
* (edit) 
tika-server/tika-server-classic/src/test/java/org/apache/tika/server/classic/TikaMimeTypesTest.java
* (add) 
tika-serialization/src/main/java/org/apache/tika/metadata/serialization/JsonFetchEmitTuple.java
* (edit) 
tika-server/tika-server-core/src/main/java/org/apache/tika/server/core/resource/RecursiveMetadataResource.java
* (edit) tika-server/tika-server-client/pom.xml
* (edit) 
tika-batch/src/test/java/org/apache/tika/batch/fs/HandlerBuilderTest.java
* (edit) tika-app/src/test/java/org/apache/tika/cli/TikaCLITest.java
* (edit) 
tika-serialization/src/test/java/org/apache/tika/metadata/serialization/JsonMetadataListTest.java
* (add) 
tika-serialization/src/main/java/org/apache/tika/metadata/serialization/JsonFetchEmitTupleList.java
* (edit) 
tika-server/tika-server-classic/src/test/java/org/apache/tika/server/classic/TikaParsersTest.java
* (edit) 
tika-core/src/main/java/org/apache/tika/pipes/fetchiterator/FetchIterator.java
* (edit) 
tika-server/tika-server-client/src/main/java/org/apache/tika/server/client/TikaClient.java
* (edit) 
tika-server/tika-server-core/src/main/java/org/apache/tika/server/core/resource/UnpackerResource.java
* (edit) tika-pipes/tika-emitters/tika-emitter-solr/pom.xml
* (edit) tika-core/src/main/java/org/apache/tika/pipes/emitter/EmptyEmitter.java
* (edit) tika-pipes/tika-httpclient-commons/pom.xml
* (edit) 
tika-server/tika-server-client/src/main/java/org/apache/tika/server/client/TikaClientCLI.java
* (edit) 
tika-server/tika-server-core/src/main/java/org/apache/tika/server/core/resource/EmitterResource.java
* (edit) 
tika-eval/tika-eval-app/src/test/resources/test-dirs/extractsA/file1.pdf.json
* (edit) 
tika-server/tika-server-core/src/main/java/org/apache/tika/server/core/resource/TikaDetectors.java
* (add) 
tika-server/tika-server-core/src/main/java/org/apache/tika/server/core/resource/AsyncRequest.java
* (edit) 
tika-pipes/tika-emitters/tika-emitter-s3/src/main/java/org/apache/tika/pipes/emitter/s3/S3Emitter.java
* (edit) 
tika-pipes/tika-fetch-iterators/tika-fetch-iterator-s3/src/main/java/org/apache/tika/pipes/fetchiterator/s3/S3FetchIterator.java
* (edit) 
tika-pipes/tika-fetch-iterators/tika-fetch-iterator-jdbc/src/main/java/org/apache/tika/pipes/fetchiterator/jdbc/JDBCFetchIterator.java
* (edit) 
tika-server/tika-server-core/src/test/java/org/apache/tika/server/core/TikaEmitterTest.java
* (edit) 
tika-serialization/src/main/java/org/apache/tika/metadata/serialization/JsonMetadataList.java
* (edit) 
tika-server/tika-server-core/src/main/java/org/apache/tika/server/core/resource/TikaParsers.java
* (edit) tika-eval/tika-eval-core/pom.xml
* (edit) 
tika-pipes/tika-fetch-iterators/tika-fetch-iterator-csv/src/main/java/org/apache/tika/pipes/fetchiterator/csv/CSVFetchIterator.java
* (edit) 
tika-server/tika-server-core/src/main/java/org/apache/tika/server/core/ServerStatusWatcher.java
* (edit) 
tika-core/src/main/java/org/apache/tika/pipes/emitter/AbstractEmitter.java
* (edit) 
tika-eval/tika-eval-app/src/main/java/org/apache/tika/eval/app/io/ExtractReader.java
* (edit) 
tika-serialization/src/main/java/org/apache/tika/metadata/serialization/PrettyMetadataKeyComparator.java
* (delete) 
tika-serialization/src/main/java/org/apache/tika/metadata/serialization/JsonMetadataSerializer.java


> Allow batching for emitters
> ---------------------------
>
>                 Key: TIKA-3288
>                 URL: https://issues.apache.org/jira/browse/TIKA-3288
>             Project: Tika
>          Issue Type: Task
>          Components: tika-pipes
>            Reporter: Tim Allison
>            Priority: Major
>
> I started sketching an interface in the code comments here: 
> [https://github.com/apache/tika/blob/main/tika-core/src/main/java/org/apache/tika/pipes/emitter/Emitter.java#L34]
>  
> The AbstractEmitter can keep track of the "batch size" – how many bytes are 
> in the batch.  The caller can check that size after each addition and call 
> executeBatch either when the batch is large enough or at the end of the task list.
>  
> We'll need a separate handler in tika-server (`async-emit`?) to 
> handle this.



--
This message was sent by Atlassian Jira
(v8.3.4#803005)

Reply via email to