nick-michaels opened a new issue, #30177:
URL: https://github.com/apache/beam/issues/30177

   ### What happened?
   
   We have Beam pipeline running in Google Dataflow (Beam SDK version `2.49.0`) 
which digests PubSub topics and stream its data into BigQuery table. 
Periodically we observe `OUT_OF_RANGE` errors in the pipeline logs:
   ```
   Error message from worker: java.lang.RuntimeException: 
org.apache.beam.sdk.util.UserCodeException: java.lang.RuntimeException: 
com.google.api.gax.rpc.OutOfRangeException: io.grpc.StatusRuntimeException: 
OUT_OF_RANGE: Offset 4143 is beyond the end of the stream Entity: 
projects/staging/datasets/flows_dataset/tables/flow_status_v1/streams/Cic2Njc0MDVhMC0wMDAwLTIwNjMtOTE3MS04ODNkMjRmZWIxYmM6czc
           
org.apache.beam.runners.dataflow.worker.GroupAlsoByWindowsParDoFn$1.output(GroupAlsoByWindowsParDoFn.java:187)
           
org.apache.beam.runners.dataflow.worker.GroupAlsoByWindowFnRunner$1.outputWindowedValue(GroupAlsoByWindowFnRunner.java:108)
           
org.apache.beam.runners.dataflow.worker.repackaged.org.apache.beam.runners.core.ReduceFnRunner.lambda$onTrigger$1(ReduceFnRunner.java:1058)
           
org.apache.beam.runners.dataflow.worker.repackaged.org.apache.beam.runners.core.ReduceFnContextFactory$OnTriggerContextImpl.output(ReduceFnContextFactory.java:445)
           
org.apache.beam.runners.dataflow.worker.repackaged.org.apache.beam.runners.core.SystemReduceFn.onTrigger(SystemReduceFn.java:130)
           
org.apache.beam.runners.dataflow.worker.repackaged.org.apache.beam.runners.core.ReduceFnRunner.onTrigger(ReduceFnRunner.java:1061)
           
org.apache.beam.runners.dataflow.worker.repackaged.org.apache.beam.runners.core.ReduceFnRunner.emit(ReduceFnRunner.java:932)
           
org.apache.beam.runners.dataflow.worker.repackaged.org.apache.beam.runners.core.ReduceFnRunner.onTimers(ReduceFnRunner.java:793)
           
org.apache.beam.runners.dataflow.worker.StreamingGroupAlsoByWindowViaWindowSetFn.processElement(StreamingGroupAlsoByWindowViaWindowSetFn.java:97)
           
org.apache.beam.runners.dataflow.worker.StreamingGroupAlsoByWindowViaWindowSetFn.processElement(StreamingGroupAlsoByWindowViaWindowSetFn.java:43)
           
org.apache.beam.runners.dataflow.worker.GroupAlsoByWindowFnRunner.invokeProcessElement(GroupAlsoByWindowFnRunner.java:121)
           
org.apache.beam.runners.dataflow.worker.GroupAlsoByWindowFnRunner.processElement(GroupAlsoByWindowFnRunner.java:73)
           
org.apache.beam.runners.dataflow.worker.repackaged.org.apache.beam.runners.core.LateDataDroppingDoFnRunner.processElement(LateDataDroppingDoFnRunner.java:80)
           
org.apache.beam.runners.dataflow.worker.GroupAlsoByWindowsParDoFn.processElement(GroupAlsoByWindowsParDoFn.java:137)
           
org.apache.beam.runners.dataflow.worker.util.common.worker.ParDoOperation.process(ParDoOperation.java:44)
           
org.apache.beam.runners.dataflow.worker.util.common.worker.OutputReceiver.process(OutputReceiver.java:54)
           
org.apache.beam.runners.dataflow.worker.util.common.worker.ReadOperation.runReadLoop(ReadOperation.java:218)
           
org.apache.beam.runners.dataflow.worker.util.common.worker.ReadOperation.start(ReadOperation.java:169)
           
org.apache.beam.runners.dataflow.worker.util.common.worker.MapTaskExecutor.execute(MapTaskExecutor.java:83)
           
org.apache.beam.runners.dataflow.worker.StreamingDataflowWorker.process(StreamingDataflowWorker.java:1404)
           
org.apache.beam.runners.dataflow.worker.StreamingDataflowWorker.access$800(StreamingDataflowWorker.java:154)
           
org.apache.beam.runners.dataflow.worker.StreamingDataflowWorker$4.run(StreamingDataflowWorker.java:1044)
           
org.apache.beam.runners.dataflow.worker.util.BoundedQueueExecutor.lambda$executeLockHeld$0(BoundedQueueExecutor.java:133)
           
java.base/java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1136)
           
java.base/java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:635)
           java.base/java.lang.Thread.run(Thread.java:833)
   Caused by: org.apache.beam.sdk.util.UserCodeException: 
java.lang.RuntimeException: com.google.api.gax.rpc.OutOfRangeException: 
io.grpc.StatusRuntimeException: OUT_OF_RANGE: Offset 4143 is beyond the end of 
the stream Entity: 
projects/staging/datasets/flows_dataset/tables/flow_status_v1/streams/Cic2Njc0MDVhMC0wMDAwLTIwNjMtOTE3MS04ODNkMjRmZWIxYmM6czc
           
org.apache.beam.sdk.util.UserCodeException.wrap(UserCodeException.java:39)
           
org.apache.beam.sdk.io.gcp.bigquery.StorageApiFlushAndFinalizeDoFn$DoFnInvoker.invokeProcessElement(Unknown
 Source)
           
org.apache.beam.runners.dataflow.worker.repackaged.org.apache.beam.runners.core.SimpleDoFnRunner.invokeProcessElement(SimpleDoFnRunner.java:211)
           
org.apache.beam.runners.dataflow.worker.repackaged.org.apache.beam.runners.core.SimpleDoFnRunner.processElement(SimpleDoFnRunner.java:188)
           
org.apache.beam.runners.dataflow.worker.SimpleParDoFn.processElement(SimpleParDoFn.java:340)
           
org.apache.beam.runners.dataflow.worker.util.common.worker.ParDoOperation.process(ParDoOperation.java:44)
           
org.apache.beam.runners.dataflow.worker.util.common.worker.OutputReceiver.process(OutputReceiver.java:54)
           
org.apache.beam.runners.dataflow.worker.GroupAlsoByWindowsParDoFn$1.output(GroupAlsoByWindowsParDoFn.java:185)
           
org.apache.beam.runners.dataflow.worker.GroupAlsoByWindowFnRunner$1.outputWindowedValue(GroupAlsoByWindowFnRunner.java:108)
           
org.apache.beam.runners.dataflow.worker.repackaged.org.apache.beam.runners.core.ReduceFnRunner.lambda$onTrigger$1(ReduceFnRunner.java:1058)
           
org.apache.beam.runners.dataflow.worker.repackaged.org.apache.beam.runners.core.ReduceFnContextFactory$OnTriggerContextImpl.output(ReduceFnContextFactory.java:445)
           
org.apache.beam.runners.dataflow.worker.repackaged.org.apache.beam.runners.core.SystemReduceFn.onTrigger(SystemReduceFn.java:130)
           
org.apache.beam.runners.dataflow.worker.repackaged.org.apache.beam.runners.core.ReduceFnRunner.onTrigger(ReduceFnRunner.java:1061)
           
org.apache.beam.runners.dataflow.worker.repackaged.org.apache.beam.runners.core.ReduceFnRunner.emit(ReduceFnRunner.java:932)
           
org.apache.beam.runners.dataflow.worker.repackaged.org.apache.beam.runners.core.ReduceFnRunner.onTimers(ReduceFnRunner.java:793)
           
org.apache.beam.runners.dataflow.worker.StreamingGroupAlsoByWindowViaWindowSetFn.processElement(StreamingGroupAlsoByWindowViaWindowSetFn.java:97)
           
org.apache.beam.runners.dataflow.worker.StreamingGroupAlsoByWindowViaWindowSetFn.processElement(StreamingGroupAlsoByWindowViaWindowSetFn.java:43)
           
org.apache.beam.runners.dataflow.worker.GroupAlsoByWindowFnRunner.invokeProcessElement(GroupAlsoByWindowFnRunner.java:121)
           
org.apache.beam.runners.dataflow.worker.GroupAlsoByWindowFnRunner.processElement(GroupAlsoByWindowFnRunner.java:73)
           
org.apache.beam.runners.dataflow.worker.repackaged.org.apache.beam.runners.core.LateDataDroppingDoFnRunner.processElement(LateDataDroppingDoFnRunner.java:80)
           
org.apache.beam.runners.dataflow.worker.GroupAlsoByWindowsParDoFn.processElement(GroupAlsoByWindowsParDoFn.java:137)
           
org.apache.beam.runners.dataflow.worker.util.common.worker.ParDoOperation.process(ParDoOperation.java:44)
           
org.apache.beam.runners.dataflow.worker.util.common.worker.OutputReceiver.process(OutputReceiver.java:54)
           
org.apache.beam.runners.dataflow.worker.util.common.worker.ReadOperation.runReadLoop(ReadOperation.java:218)
           
org.apache.beam.runners.dataflow.worker.util.common.worker.ReadOperation.start(ReadOperation.java:169)
           
org.apache.beam.runners.dataflow.worker.util.common.worker.MapTaskExecutor.execute(MapTaskExecutor.java:83)
           
org.apache.beam.runners.dataflow.worker.StreamingDataflowWorker.process(StreamingDataflowWorker.java:1404)
           
org.apache.beam.runners.dataflow.worker.StreamingDataflowWorker.access$800(StreamingDataflowWorker.java:154)
           
org.apache.beam.runners.dataflow.worker.StreamingDataflowWorker$4.run(StreamingDataflowWorker.java:1044)
           
org.apache.beam.runners.dataflow.worker.util.BoundedQueueExecutor.lambda$executeLockHeld$0(BoundedQueueExecutor.java:133)
           
java.base/java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1136)
           
java.base/java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:635)
           java.base/java.lang.Thread.run(Thread.java:833)
   Caused by: java.lang.RuntimeException: 
com.google.api.gax.rpc.OutOfRangeException: io.grpc.StatusRuntimeException: 
OUT_OF_RANGE: Offset 4143 is beyond the end of the stream Entity: 
projects/staging/datasets/flows_dataset/tables/flow_status_v1/streams/Cic2Njc0MDVhMC0wMDAwLTIwNjMtOTE3MS04ODNkMjRmZWIxYmM6czc
           
org.apache.beam.sdk.io.gcp.bigquery.RetryManager.await(RetryManager.java:270)
           
org.apache.beam.sdk.io.gcp.bigquery.RetryManager.run(RetryManager.java:251)
           
org.apache.beam.sdk.io.gcp.bigquery.StorageApiFlushAndFinalizeDoFn.process(StorageApiFlushAndFinalizeDoFn.java:187)
   Caused by: com.google.api.gax.rpc.OutOfRangeException: 
io.grpc.StatusRuntimeException: OUT_OF_RANGE: Offset 4143 is beyond the end of 
the stream Entity: 
projects/staging/datasets/flows_dataset/tables/flow_status_v1/streams/Cic2Njc0MDVhMC0wMDAwLTIwNjMtOTE3MS04ODNkMjRmZWIxYmM6czc
           
com.google.api.gax.rpc.ApiExceptionFactory.createException(ApiExceptionFactory.java:106)
           
com.google.api.gax.rpc.ApiExceptionFactory.createException(ApiExceptionFactory.java:41)
           
com.google.api.gax.grpc.GrpcApiExceptionFactory.create(GrpcApiExceptionFactory.java:86)
           
com.google.api.gax.grpc.GrpcApiExceptionFactory.create(GrpcApiExceptionFactory.java:66)
           
com.google.api.gax.grpc.GrpcExceptionCallable$ExceptionTransformingFuture.onFailure(GrpcExceptionCallable.java:97)
           com.google.api.core.ApiFutures$1.onFailure(ApiFutures.java:84)
           
com.google.common.util.concurrent.Futures$CallbackListener.run(Futures.java:1127)
           
com.google.common.util.concurrent.DirectExecutor.execute(DirectExecutor.java:31)
           
com.google.common.util.concurrent.AbstractFuture.executeListener(AbstractFuture.java:1286)
           
com.google.common.util.concurrent.AbstractFuture.complete(AbstractFuture.java:1055)
           
com.google.common.util.concurrent.AbstractFuture.setException(AbstractFuture.java:807)
           
io.grpc.stub.ClientCalls$GrpcFuture.setException(ClientCalls.java:578)
           
io.grpc.stub.ClientCalls$UnaryStreamToFuture.onClose(ClientCalls.java:548)
           
io.grpc.PartialForwardingClientCallListener.onClose(PartialForwardingClientCallListener.java:39)
           
io.grpc.ForwardingClientCallListener.onClose(ForwardingClientCallListener.java:23)
           
io.grpc.ForwardingClientCallListener$SimpleForwardingClientCallListener.onClose(ForwardingClientCallListener.java:40)
           
com.google.api.gax.grpc.ChannelPool$ReleasingClientCall$1.onClose(ChannelPool.java:541)
           
io.grpc.PartialForwardingClientCallListener.onClose(PartialForwardingClientCallListener.java:39)
           
io.grpc.ForwardingClientCallListener.onClose(ForwardingClientCallListener.java:23)
           
io.grpc.ForwardingClientCallListener$SimpleForwardingClientCallListener.onClose(ForwardingClientCallListener.java:40)
           
io.grpc.census.CensusStatsModule$StatsClientInterceptor$1$1.onClose(CensusStatsModule.java:814)
           
io.grpc.PartialForwardingClientCallListener.onClose(PartialForwardingClientCallListener.java:39)
           
io.grpc.ForwardingClientCallListener.onClose(ForwardingClientCallListener.java:23)
           
io.grpc.ForwardingClientCallListener$SimpleForwardingClientCallListener.onClose(ForwardingClientCallListener.java:40)
           
io.grpc.census.CensusTracingModule$TracingClientInterceptor$1$1.onClose(CensusTracingModule.java:494)
           
io.grpc.internal.ClientCallImpl.closeObserver(ClientCallImpl.java:567)
           io.grpc.internal.ClientCallImpl.access$300(ClientCallImpl.java:71)
           
io.grpc.internal.ClientCallImpl$ClientStreamListenerImpl$1StreamClosed.runInternal(ClientCallImpl.java:735)
           
io.grpc.internal.ClientCallImpl$ClientStreamListenerImpl$1StreamClosed.runInContext(ClientCallImpl.java:716)
           io.grpc.internal.ContextRunnable.run(ContextRunnable.java:37)
           
io.grpc.internal.SerializingExecutor.run(SerializingExecutor.java:133)
           
java.base/java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1136)
           
java.base/java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:635)
           java.base/java.lang.Thread.run(Thread.java:833)
   Caused by: io.grpc.StatusRuntimeException: OUT_OF_RANGE: Offset 4143 is 
beyond the end of the stream Entity: 
projects/staging/datasets/flows_dataset/tables/flow_status_v1/streams/Cic2Njc0MDVhMC0wMDAwLTIwNjMtOTE3MS04ODNkMjRmZWIxYmM6czc
           io.grpc.Status.asRuntimeException(Status.java:539)
           
io.grpc.stub.ClientCalls$UnaryStreamToFuture.onClose(ClientCalls.java:548)
           
io.grpc.PartialForwardingClientCallListener.onClose(PartialForwardingClientCallListener.java:39)
           
io.grpc.ForwardingClientCallListener.onClose(ForwardingClientCallListener.java:23)
           
io.grpc.ForwardingClientCallListener$SimpleForwardingClientCallListener.onClose(ForwardingClientCallListener.java:40)
           
com.google.api.gax.grpc.ChannelPool$ReleasingClientCall$1.onClose(ChannelPool.java:541)
           
io.grpc.PartialForwardingClientCallListener.onClose(PartialForwardingClientCallListener.java:39)
           
io.grpc.ForwardingClientCallListener.onClose(ForwardingClientCallListener.java:23)
           
io.grpc.ForwardingClientCallListener$SimpleForwardingClientCallListener.onClose(ForwardingClientCallListener.java:40)
           
io.grpc.census.CensusStatsModule$StatsClientInterceptor$1$1.onClose(CensusStatsModule.java:814)
           
io.grpc.PartialForwardingClientCallListener.onClose(PartialForwardingClientCallListener.java:39)
           
io.grpc.ForwardingClientCallListener.onClose(ForwardingClientCallListener.java:23)
           
io.grpc.ForwardingClientCallListener$SimpleForwardingClientCallListener.onClose(ForwardingClientCallListener.java:40)
           
io.grpc.census.CensusTracingModule$TracingClientInterceptor$1$1.onClose(CensusTracingModule.java:494)
           
io.grpc.internal.ClientCallImpl.closeObserver(ClientCallImpl.java:567)
           io.grpc.internal.ClientCallImpl.access$300(ClientCallImpl.java:71)
           
io.grpc.internal.ClientCallImpl$ClientStreamListenerImpl$1StreamClosed.runInternal(ClientCallImpl.java:735)
           
io.grpc.internal.ClientCallImpl$ClientStreamListenerImpl$1StreamClosed.runInContext(ClientCallImpl.java:716)
           io.grpc.internal.ContextRunnable.run(ContextRunnable.java:37)
           
io.grpc.internal.SerializingExecutor.run(SerializingExecutor.java:133)
           
java.base/java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1136)
           
java.base/java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:635)
           java.base/java.lang.Thread.run(Thread.java:833)
   ```
   
   ### Issue Priority
   
   Priority: 2 (default / most bugs should be filed as P2)
   
   ### Issue Components
   
   - [ ] Component: Python SDK
   - [X] Component: Java SDK
   - [ ] Component: Go SDK
   - [ ] Component: Typescript SDK
   - [ ] Component: IO connector
   - [ ] Component: Beam YAML
   - [ ] Component: Beam examples
   - [ ] Component: Beam playground
   - [ ] Component: Beam katas
   - [ ] Component: Website
   - [ ] Component: Spark Runner
   - [ ] Component: Flink Runner
   - [ ] Component: Samza Runner
   - [ ] Component: Twister2 Runner
   - [ ] Component: Hazelcast Jet Runner
   - [X] Component: Google Cloud Dataflow Runner


-- 
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.

To unsubscribe, e-mail: github-unsubscr...@beam.apache.org.apache.org

For queries about this service, please contact Infrastructure at:
us...@infra.apache.org

Reply via email to