[ 
https://issues.apache.org/jira/browse/FLINK-25026?page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel&focusedCommentId=17464800#comment-17464800
 ] 

Seth Wiesman commented on FLINK-25026:
--------------------------------------

https://dev.azure.com/apache-flink/apache-flink/_build/results?buildId=28549&view=logs&j=5c8e7682-d68f-54d1-16a2-a09310218a49&t=86f654fa-ab48-5c1a-25f4-7e7f6afb9bba

> UnalignedCheckpointRescaleITCase.shouldRescaleUnalignedCheckpoint fails on AZP
> ------------------------------------------------------------------------------
>
>                 Key: FLINK-25026
>                 URL: https://issues.apache.org/jira/browse/FLINK-25026
>             Project: Flink
>          Issue Type: Bug
>          Components: Runtime / Checkpointing
>    Affects Versions: 1.14.0
>            Reporter: Till Rohrmann
>            Priority: Major
>              Labels: test-stability
>             Fix For: 1.14.3
>
>
> {{UnalignedCheckpointRescaleITCase.shouldRescaleUnalignedCheckpoint}} fails 
> on AZP with
> {code}
> 2021-11-23T00:58:03.8286352Z Nov 23 00:58:03 [ERROR] Tests run: 72, Failures: 
> 0, Errors: 1, Skipped: 0, Time elapsed: 716.362 s <<< FAILURE! - in 
> org.apache.flink.test.checkpointing.UnalignedCheckpointRescaleITCase
> 2021-11-23T00:58:03.8288790Z Nov 23 00:58:03 [ERROR] 
> shouldRescaleUnalignedCheckpoint[downscale union from 3 to 2, 
> buffersPerChannel = 1]  Time elapsed: 4.051 s  <<< ERROR!
> 2021-11-23T00:58:03.8289953Z Nov 23 00:58:03 
> org.apache.flink.runtime.client.JobExecutionException: Job execution failed.
> 2021-11-23T00:58:03.8291473Z Nov 23 00:58:03  at 
> org.apache.flink.runtime.jobmaster.JobResult.toJobExecutionResult(JobResult.java:144)
> 2021-11-23T00:58:03.8292776Z Nov 23 00:58:03  at 
> org.apache.flink.test.checkpointing.UnalignedCheckpointTestBase.execute(UnalignedCheckpointTestBase.java:168)
> 2021-11-23T00:58:03.8294520Z Nov 23 00:58:03  at 
> org.apache.flink.test.checkpointing.UnalignedCheckpointRescaleITCase.shouldRescaleUnalignedCheckpoint(UnalignedCheckpointRescaleITCase.java:534)
> 2021-11-23T00:58:03.8295909Z Nov 23 00:58:03  at 
> jdk.internal.reflect.GeneratedMethodAccessor123.invoke(Unknown Source)
> 2021-11-23T00:58:03.8297310Z Nov 23 00:58:03  at 
> java.base/jdk.internal.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43)
> 2021-11-23T00:58:03.8298922Z Nov 23 00:58:03  at 
> java.base/java.lang.reflect.Method.invoke(Method.java:566)
> 2021-11-23T00:58:03.8300298Z Nov 23 00:58:03  at 
> org.junit.runners.model.FrameworkMethod$1.runReflectiveCall(FrameworkMethod.java:59)
> 2021-11-23T00:58:03.8301741Z Nov 23 00:58:03  at 
> org.junit.internal.runners.model.ReflectiveCallable.run(ReflectiveCallable.java:12)
> 2021-11-23T00:58:03.8303233Z Nov 23 00:58:03  at 
> org.junit.runners.model.FrameworkMethod.invokeExplosively(FrameworkMethod.java:56)
> 2021-11-23T00:58:03.8304514Z Nov 23 00:58:03  at 
> org.junit.internal.runners.statements.InvokeMethod.evaluate(InvokeMethod.java:17)
> 2021-11-23T00:58:03.8305736Z Nov 23 00:58:03  at 
> org.junit.rules.Verifier$1.evaluate(Verifier.java:35)
> 2021-11-23T00:58:03.8306856Z Nov 23 00:58:03  at 
> org.junit.rules.TestWatcher$1.evaluate(TestWatcher.java:61)
> 2021-11-23T00:58:03.8308218Z Nov 23 00:58:03  at 
> org.junit.rules.ExternalResource$1.evaluate(ExternalResource.java:54)
> 2021-11-23T00:58:03.8309532Z Nov 23 00:58:03  at 
> org.apache.flink.util.TestNameProvider$1.evaluate(TestNameProvider.java:45)
> 2021-11-23T00:58:03.8310780Z Nov 23 00:58:03  at 
> org.junit.rules.TestWatcher$1.evaluate(TestWatcher.java:61)
> 2021-11-23T00:58:03.8312026Z Nov 23 00:58:03  at 
> org.junit.runners.ParentRunner$3.evaluate(ParentRunner.java:306)
> 2021-11-23T00:58:03.8313515Z Nov 23 00:58:03  at 
> org.junit.runners.BlockJUnit4ClassRunner$1.evaluate(BlockJUnit4ClassRunner.java:100)
> 2021-11-23T00:58:03.8314842Z Nov 23 00:58:03  at 
> org.junit.runners.ParentRunner.runLeaf(ParentRunner.java:366)
> 2021-11-23T00:58:03.8316116Z Nov 23 00:58:03  at 
> org.junit.runners.BlockJUnit4ClassRunner.runChild(BlockJUnit4ClassRunner.java:103)
> 2021-11-23T00:58:03.8317538Z Nov 23 00:58:03  at 
> org.junit.runners.BlockJUnit4ClassRunner.runChild(BlockJUnit4ClassRunner.java:63)
> 2021-11-23T00:58:03.8320044Z Nov 23 00:58:03  at 
> org.junit.runners.ParentRunner$4.run(ParentRunner.java:331)
> 2021-11-23T00:58:03.8321044Z Nov 23 00:58:03  at 
> org.junit.runners.ParentRunner$1.schedule(ParentRunner.java:79)
> 2021-11-23T00:58:03.8321978Z Nov 23 00:58:03  at 
> org.junit.runners.ParentRunner.runChildren(ParentRunner.java:329)
> 2021-11-23T00:58:03.8322915Z Nov 23 00:58:03  at 
> org.junit.runners.ParentRunner.access$100(ParentRunner.java:66)
> 2021-11-23T00:58:03.8323848Z Nov 23 00:58:03  at 
> org.junit.runners.ParentRunner$2.evaluate(ParentRunner.java:293)
> 2021-11-23T00:58:03.8325330Z Nov 23 00:58:03  at 
> org.junit.runners.ParentRunner.run(ParentRunner.java:413)
> 2021-11-23T00:58:03.8337747Z Nov 23 00:58:03  at 
> org.junit.runners.Suite.runChild(Suite.java:128)
> 2021-11-23T00:58:03.8339178Z Nov 23 00:58:03  at 
> org.junit.runners.Suite.runChild(Suite.java:27)
> 2021-11-23T00:58:03.8340038Z Nov 23 00:58:03  at 
> org.junit.runners.ParentRunner$4.run(ParentRunner.java:331)
> 2021-11-23T00:58:03.8340967Z Nov 23 00:58:03  at 
> org.junit.runners.ParentRunner$1.schedule(ParentRunner.java:79)
> 2021-11-23T00:58:03.8341889Z Nov 23 00:58:03  at 
> org.junit.runners.ParentRunner.runChildren(ParentRunner.java:329)
> 2021-11-23T00:58:03.8342923Z Nov 23 00:58:03  at 
> org.junit.runners.ParentRunner.access$100(ParentRunner.java:66)
> 2021-11-23T00:58:03.8343842Z Nov 23 00:58:03  at 
> org.junit.runners.ParentRunner$2.evaluate(ParentRunner.java:293)
> 2021-11-23T00:58:03.8344979Z Nov 23 00:58:03  at 
> org.junit.runners.ParentRunner$3.evaluate(ParentRunner.java:306)
> 2021-11-23T00:58:03.8345869Z Nov 23 00:58:03  at 
> org.junit.runners.ParentRunner.run(ParentRunner.java:413)
> 2021-11-23T00:58:03.8346717Z Nov 23 00:58:03  at 
> org.junit.runner.JUnitCore.run(JUnitCore.java:137)
> 2021-11-23T00:58:03.8347642Z Nov 23 00:58:03  at 
> org.junit.runner.JUnitCore.run(JUnitCore.java:115)
> 2021-11-23T00:58:03.8348570Z Nov 23 00:58:03  at 
> org.junit.vintage.engine.execution.RunnerExecutor.execute(RunnerExecutor.java:43)
> 2021-11-23T00:58:03.8349582Z Nov 23 00:58:03  at 
> java.base/java.util.stream.ForEachOps$ForEachOp$OfRef.accept(ForEachOps.java:183)
> 2021-11-23T00:58:03.8350583Z Nov 23 00:58:03  at 
> java.base/java.util.stream.ReferencePipeline$3$1.accept(ReferencePipeline.java:195)
> 2021-11-23T00:58:03.8351521Z Nov 23 00:58:03  at 
> java.base/java.util.Iterator.forEachRemaining(Iterator.java:133)
> 2021-11-23T00:58:03.8352509Z Nov 23 00:58:03  at 
> java.base/java.util.Spliterators$IteratorSpliterator.forEachRemaining(Spliterators.java:1801)
> 2021-11-23T00:58:03.8353653Z Nov 23 00:58:03  at 
> java.base/java.util.stream.AbstractPipeline.copyInto(AbstractPipeline.java:484)
> 2021-11-23T00:58:03.8354667Z Nov 23 00:58:03  at 
> java.base/java.util.stream.AbstractPipeline.wrapAndCopyInto(AbstractPipeline.java:474)
> 2021-11-23T00:58:03.8355701Z Nov 23 00:58:03  at 
> java.base/java.util.stream.ForEachOps$ForEachOp.evaluateSequential(ForEachOps.java:150)
> 2021-11-23T00:58:03.8356744Z Nov 23 00:58:03  at 
> java.base/java.util.stream.ForEachOps$ForEachOp$OfRef.evaluateSequential(ForEachOps.java:173)
> 2021-11-23T00:58:03.8357943Z Nov 23 00:58:03  at 
> java.base/java.util.stream.AbstractPipeline.evaluate(AbstractPipeline.java:234)
> 2021-11-23T00:58:03.8358932Z Nov 23 00:58:03  at 
> java.base/java.util.stream.ReferencePipeline.forEach(ReferencePipeline.java:497)
> 2021-11-23T00:58:03.8359943Z Nov 23 00:58:03  at 
> org.junit.vintage.engine.VintageTestEngine.executeAllChildren(VintageTestEngine.java:82)
> 2021-11-23T00:58:03.8360971Z Nov 23 00:58:03  at 
> org.junit.vintage.engine.VintageTestEngine.execute(VintageTestEngine.java:73)
> 2021-11-23T00:58:03.8361986Z Nov 23 00:58:03  at 
> org.junit.platform.launcher.core.DefaultLauncher.execute(DefaultLauncher.java:220)
> 2021-11-23T00:58:03.8363143Z Nov 23 00:58:03  at 
> org.junit.platform.launcher.core.DefaultLauncher.lambda$execute$6(DefaultLauncher.java:188)
> 2021-11-23T00:58:03.8364237Z Nov 23 00:58:03  at 
> org.junit.platform.launcher.core.DefaultLauncher.withInterceptedStreams(DefaultLauncher.java:202)
> 2021-11-23T00:58:03.8365279Z Nov 23 00:58:03  at 
> org.junit.platform.launcher.core.DefaultLauncher.execute(DefaultLauncher.java:181)
> 2021-11-23T00:58:03.8366302Z Nov 23 00:58:03  at 
> org.junit.platform.launcher.core.DefaultLauncher.execute(DefaultLauncher.java:128)
> 2021-11-23T00:58:03.8367523Z Nov 23 00:58:03  at 
> org.apache.maven.surefire.junitplatform.JUnitPlatformProvider.invokeAllTests(JUnitPlatformProvider.java:150)
> 2021-11-23T00:58:03.8368587Z Nov 23 00:58:03  at 
> org.apache.maven.surefire.junitplatform.JUnitPlatformProvider.invoke(JUnitPlatformProvider.java:120)
> 2021-11-23T00:58:03.8369888Z Nov 23 00:58:03  at 
> org.apache.maven.surefire.booter.ForkedBooter.invokeProviderInSameClassLoader(ForkedBooter.java:384)
> 2021-11-23T00:58:03.8370965Z Nov 23 00:58:03  at 
> org.apache.maven.surefire.booter.ForkedBooter.runSuitesInProcess(ForkedBooter.java:345)
> 2021-11-23T00:58:03.8371971Z Nov 23 00:58:03  at 
> org.apache.maven.surefire.booter.ForkedBooter.execute(ForkedBooter.java:126)
> 2021-11-23T00:58:03.8373028Z Nov 23 00:58:03  at 
> org.apache.maven.surefire.booter.ForkedBooter.main(ForkedBooter.java:418)
> 2021-11-23T00:58:03.8374193Z Nov 23 00:58:03 Caused by: 
> org.apache.flink.runtime.JobException: Recovery is suppressed by 
> FixedDelayRestartBackoffTimeStrategy(maxNumberRestartAttempts=0, 
> backoffTimeMS=100)
> 2021-11-23T00:58:03.8375495Z Nov 23 00:58:03  at 
> org.apache.flink.runtime.executiongraph.failover.flip1.ExecutionFailureHandler.handleFailure(ExecutionFailureHandler.java:138)
> 2021-11-23T00:58:03.8376816Z Nov 23 00:58:03  at 
> org.apache.flink.runtime.executiongraph.failover.flip1.ExecutionFailureHandler.getFailureHandlingResult(ExecutionFailureHandler.java:82)
> 2021-11-23T00:58:03.8378373Z Nov 23 00:58:03  at 
> org.apache.flink.runtime.scheduler.DefaultScheduler.handleTaskFailure(DefaultScheduler.java:228)
> 2021-11-23T00:58:03.8379481Z Nov 23 00:58:03  at 
> org.apache.flink.runtime.scheduler.DefaultScheduler.maybeHandleTaskFailure(DefaultScheduler.java:218)
> 2021-11-23T00:58:03.8380644Z Nov 23 00:58:03  at 
> org.apache.flink.runtime.scheduler.DefaultScheduler.updateTaskExecutionStateInternal(DefaultScheduler.java:209)
> 2021-11-23T00:58:03.8381808Z Nov 23 00:58:03  at 
> org.apache.flink.runtime.scheduler.SchedulerBase.updateTaskExecutionState(SchedulerBase.java:682)
> 2021-11-23T00:58:03.8382989Z Nov 23 00:58:03  at 
> org.apache.flink.runtime.scheduler.SchedulerNG.updateTaskExecutionState(SchedulerNG.java:79)
> 2021-11-23T00:58:03.8384070Z Nov 23 00:58:03  at 
> org.apache.flink.runtime.jobmaster.JobMaster.updateTaskExecutionState(JobMaster.java:444)
> 2021-11-23T00:58:03.8385037Z Nov 23 00:58:03  at 
> jdk.internal.reflect.GeneratedMethodAccessor39.invoke(Unknown Source)
> 2021-11-23T00:58:03.8386030Z Nov 23 00:58:03  at 
> java.base/jdk.internal.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43)
> 2021-11-23T00:58:03.8387020Z Nov 23 00:58:03  at 
> java.base/java.lang.reflect.Method.invoke(Method.java:566)
> 2021-11-23T00:58:03.8388110Z Nov 23 00:58:03  at 
> org.apache.flink.runtime.rpc.akka.AkkaRpcActor.lambda$handleRpcInvocation$1(AkkaRpcActor.java:316)
> 2021-11-23T00:58:03.8389282Z Nov 23 00:58:03  at 
> org.apache.flink.runtime.concurrent.akka.ClassLoadingUtils.runWithContextClassLoader(ClassLoadingUtils.java:83)
> 2021-11-23T00:58:03.8390376Z Nov 23 00:58:03  at 
> org.apache.flink.runtime.rpc.akka.AkkaRpcActor.handleRpcInvocation(AkkaRpcActor.java:314)
> 2021-11-23T00:58:03.8391456Z Nov 23 00:58:03  at 
> org.apache.flink.runtime.rpc.akka.AkkaRpcActor.handleRpcMessage(AkkaRpcActor.java:217)
> 2021-11-23T00:58:03.8392539Z Nov 23 00:58:03  at 
> org.apache.flink.runtime.rpc.akka.FencedAkkaRpcActor.handleRpcMessage(FencedAkkaRpcActor.java:78)
> 2021-11-23T00:58:03.8393742Z Nov 23 00:58:03  at 
> org.apache.flink.runtime.rpc.akka.AkkaRpcActor.handleMessage(AkkaRpcActor.java:163)
> 2021-11-23T00:58:03.8394719Z Nov 23 00:58:03  at 
> akka.japi.pf.UnitCaseStatement.apply(CaseStatements.scala:24)
> 2021-11-23T00:58:03.8395626Z Nov 23 00:58:03  at 
> akka.japi.pf.UnitCaseStatement.apply(CaseStatements.scala:20)
> 2021-11-23T00:58:03.8396513Z Nov 23 00:58:03  at 
> scala.PartialFunction.applyOrElse(PartialFunction.scala:123)
> 2021-11-23T00:58:03.8397497Z Nov 23 00:58:03  at 
> scala.PartialFunction.applyOrElse$(PartialFunction.scala:122)
> 2021-11-23T00:58:03.8398435Z Nov 23 00:58:03  at 
> akka.japi.pf.UnitCaseStatement.applyOrElse(CaseStatements.scala:20)
> 2021-11-23T00:58:03.8399349Z Nov 23 00:58:03  at 
> scala.PartialFunction$OrElse.applyOrElse(PartialFunction.scala:171)
> 2021-11-23T00:58:03.8400292Z Nov 23 00:58:03  at 
> scala.PartialFunction$OrElse.applyOrElse(PartialFunction.scala:172)
> 2021-11-23T00:58:03.8401223Z Nov 23 00:58:03  at 
> scala.PartialFunction$OrElse.applyOrElse(PartialFunction.scala:172)
> 2021-11-23T00:58:03.8402260Z Nov 23 00:58:03  at 
> akka.actor.Actor.aroundReceive(Actor.scala:537)
> 2021-11-23T00:58:03.8403157Z Nov 23 00:58:03  at 
> akka.actor.Actor.aroundReceive$(Actor.scala:535)
> 2021-11-23T00:58:03.8404030Z Nov 23 00:58:03  at 
> akka.actor.AbstractActor.aroundReceive(AbstractActor.scala:220)
> 2021-11-23T00:58:03.8404934Z Nov 23 00:58:03  at 
> akka.actor.ActorCell.receiveMessage(ActorCell.scala:580)
> 2021-11-23T00:58:03.8405775Z Nov 23 00:58:03  at 
> akka.actor.ActorCell.invoke(ActorCell.scala:548)
> 2021-11-23T00:58:03.8406616Z Nov 23 00:58:03  at 
> akka.dispatch.Mailbox.processMailbox(Mailbox.scala:270)
> 2021-11-23T00:58:03.8407512Z Nov 23 00:58:03  at 
> akka.dispatch.Mailbox.run(Mailbox.scala:231)
> 2021-11-23T00:58:03.8408312Z Nov 23 00:58:03  at 
> akka.dispatch.Mailbox.exec(Mailbox.scala:243)
> 2021-11-23T00:58:03.8409185Z Nov 23 00:58:03  at 
> java.base/java.util.concurrent.ForkJoinTask.doExec(ForkJoinTask.java:290)
> 2021-11-23T00:58:03.8410322Z Nov 23 00:58:03  at 
> java.base/java.util.concurrent.ForkJoinPool$WorkQueue.topLevelExec(ForkJoinPool.java:1020)
> 2021-11-23T00:58:03.8411305Z Nov 23 00:58:03  at 
> java.base/java.util.concurrent.ForkJoinPool.scan(ForkJoinPool.java:1656)
> 2021-11-23T00:58:03.8412209Z Nov 23 00:58:03  at 
> java.base/java.util.concurrent.ForkJoinPool.runWorker(ForkJoinPool.java:1594)
> 2021-11-23T00:58:03.8413192Z Nov 23 00:58:03  at 
> java.base/java.util.concurrent.ForkJoinWorkerThread.run(ForkJoinWorkerThread.java:183)
> 2021-11-23T00:58:03.8415356Z Nov 23 00:58:03 Caused by: 
> org.apache.flink.runtime.io.network.netty.exception.LocalTransportException: 
> Direct buffer memory (connection to 'localhost/127.0.0.1:35630')
> 2021-11-23T00:58:03.8416790Z Nov 23 00:58:03  at 
> org.apache.flink.runtime.io.network.netty.CreditBasedPartitionRequestClientHandler.exceptionCaught(CreditBasedPartitionRequestClientHandler.java:177)
> 2021-11-23T00:58:03.8418297Z Nov 23 00:58:03  at 
> org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannelHandlerContext.invokeExceptionCaught(AbstractChannelHandlerContext.java:302)
> 2021-11-23T00:58:03.8419680Z Nov 23 00:58:03  at 
> org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannelHandlerContext.invokeExceptionCaught(AbstractChannelHandlerContext.java:281)
> 2021-11-23T00:58:03.8421026Z Nov 23 00:58:03  at 
> org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannelHandlerContext.fireExceptionCaught(AbstractChannelHandlerContext.java:273)
> 2021-11-23T00:58:03.8422366Z Nov 23 00:58:03  at 
> org.apache.flink.shaded.netty4.io.netty.channel.ChannelInboundHandlerAdapter.exceptionCaught(ChannelInboundHandlerAdapter.java:143)
> 2021-11-23T00:58:03.8423806Z Nov 23 00:58:03  at 
> org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannelHandlerContext.invokeExceptionCaught(AbstractChannelHandlerContext.java:302)
> 2021-11-23T00:58:03.8425153Z Nov 23 00:58:03  at 
> org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannelHandlerContext.invokeChannelActive(AbstractChannelHandlerContext.java:232)
> 2021-11-23T00:58:03.8426512Z Nov 23 00:58:03  at 
> org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannelHandlerContext.invokeChannelActive(AbstractChannelHandlerContext.java:216)
> 2021-11-23T00:58:03.8427954Z Nov 23 00:58:03  at 
> org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannelHandlerContext.fireChannelActive(AbstractChannelHandlerContext.java:209)
> 2021-11-23T00:58:03.8429271Z Nov 23 00:58:03  at 
> org.apache.flink.shaded.netty4.io.netty.channel.DefaultChannelPipeline$HeadContext.channelActive(DefaultChannelPipeline.java:1398)
> 2021-11-23T00:58:03.8430603Z Nov 23 00:58:03  at 
> org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannelHandlerContext.invokeChannelActive(AbstractChannelHandlerContext.java:230)
> 2021-11-23T00:58:03.8431934Z Nov 23 00:58:03  at 
> org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannelHandlerContext.invokeChannelActive(AbstractChannelHandlerContext.java:216)
> 2021-11-23T00:58:03.8433297Z Nov 23 00:58:03  at 
> org.apache.flink.shaded.netty4.io.netty.channel.DefaultChannelPipeline.fireChannelActive(DefaultChannelPipeline.java:895)
> 2021-11-23T00:58:03.8434775Z Nov 23 00:58:03  at 
> org.apache.flink.shaded.netty4.io.netty.channel.epoll.AbstractEpollChannel$AbstractEpollUnsafe.fulfillConnectPromise(AbstractEpollChannel.java:658)
> 2021-11-23T00:58:03.8436107Z Nov 23 00:58:03  at 
> org.apache.flink.shaded.netty4.io.netty.channel.epoll.AbstractEpollChannel$AbstractEpollUnsafe.finishConnect(AbstractEpollChannel.java:691)
> 2021-11-23T00:58:03.8437442Z Nov 23 00:58:03  at 
> org.apache.flink.shaded.netty4.io.netty.channel.epoll.AbstractEpollChannel$AbstractEpollUnsafe.epollOutReady(AbstractEpollChannel.java:567)
> 2021-11-23T00:58:03.8438654Z Nov 23 00:58:03  at 
> org.apache.flink.shaded.netty4.io.netty.channel.epoll.EpollEventLoop.processReady(EpollEventLoop.java:470)
> 2021-11-23T00:58:03.8439768Z Nov 23 00:58:03  at 
> org.apache.flink.shaded.netty4.io.netty.channel.epoll.EpollEventLoop.run(EpollEventLoop.java:378)
> 2021-11-23T00:58:03.8440960Z Nov 23 00:58:03  at 
> org.apache.flink.shaded.netty4.io.netty.util.concurrent.SingleThreadEventExecutor$4.run(SingleThreadEventExecutor.java:989)
> 2021-11-23T00:58:03.8442282Z Nov 23 00:58:03  at 
> org.apache.flink.shaded.netty4.io.netty.util.internal.ThreadExecutorMap$2.run(ThreadExecutorMap.java:74)
> 2021-11-23T00:58:03.8443317Z Nov 23 00:58:03  at 
> java.base/java.lang.Thread.run(Thread.java:829)
> 2021-11-23T00:58:03.8448100Z Nov 23 00:58:03 Caused by: 
> java.lang.OutOfMemoryError: Direct buffer memory. The direct out-of-memory 
> error has occurred. This can mean two things: either job(s) require(s) a 
> larger size of JVM direct memory or there is a direct memory leak. The direct 
> memory can be allocated by user code or some of its dependencies. In this 
> case 'taskmanager.memory.task.off-heap.size' configuration option should be 
> increased. Flink framework and its dependencies also consume the direct 
> memory, mostly for network communication. The most of network memory is 
> managed by Flink and should not result in out-of-memory error. In certain 
> special cases, in particular for jobs with high parallelism, the framework 
> may require more direct memory which is not managed by Flink. In this case 
> 'taskmanager.memory.framework.off-heap.size' configuration option should be 
> increased. If the error persists then there is probably a direct memory leak 
> in user code or some of its dependencies which has to be investigated and 
> fixed. The task executor has to be shutdown...
> 2021-11-23T00:58:03.8451299Z Nov 23 00:58:03  at 
> java.base/java.nio.Bits.reserveMemory(Bits.java:175)
> 2021-11-23T00:58:03.8452187Z Nov 23 00:58:03  at 
> java.base/java.nio.DirectByteBuffer.<init>(DirectByteBuffer.java:118)
> 2021-11-23T00:58:03.8453176Z Nov 23 00:58:03  at 
> java.base/java.nio.ByteBuffer.allocateDirect(ByteBuffer.java:317)
> 2021-11-23T00:58:03.8454212Z Nov 23 00:58:03  at 
> org.apache.flink.shaded.netty4.io.netty.buffer.PoolArena$DirectArena.allocateDirect(PoolArena.java:632)
> 2021-11-23T00:58:03.8455342Z Nov 23 00:58:03  at 
> org.apache.flink.shaded.netty4.io.netty.buffer.PoolArena$DirectArena.newChunk(PoolArena.java:607)
> 2021-11-23T00:58:03.8456445Z Nov 23 00:58:03  at 
> org.apache.flink.shaded.netty4.io.netty.buffer.PoolArena.allocateNormal(PoolArena.java:202)
> 2021-11-23T00:58:03.8457611Z Nov 23 00:58:03  at 
> org.apache.flink.shaded.netty4.io.netty.buffer.PoolArena.tcacheAllocateSmall(PoolArena.java:172)
> 2021-11-23T00:58:03.8458688Z Nov 23 00:58:03  at 
> org.apache.flink.shaded.netty4.io.netty.buffer.PoolArena.allocate(PoolArena.java:134)
> 2021-11-23T00:58:03.8459728Z Nov 23 00:58:03  at 
> org.apache.flink.shaded.netty4.io.netty.buffer.PoolArena.allocate(PoolArena.java:126)
> 2021-11-23T00:58:03.8460782Z Nov 23 00:58:03  at 
> org.apache.flink.shaded.netty4.io.netty.buffer.PooledByteBufAllocator.newDirectBuffer(PooledByteBufAllocator.java:395)
> 2021-11-23T00:58:03.8462013Z Nov 23 00:58:03  at 
> org.apache.flink.shaded.netty4.io.netty.buffer.AbstractByteBufAllocator.directBuffer(AbstractByteBufAllocator.java:187)
> 2021-11-23T00:58:03.8463326Z Nov 23 00:58:03  at 
> org.apache.flink.shaded.netty4.io.netty.buffer.AbstractByteBufAllocator.directBuffer(AbstractByteBufAllocator.java:178)
> 2021-11-23T00:58:03.8464695Z Nov 23 00:58:03  at 
> org.apache.flink.runtime.io.network.netty.BufferResponseDecoder.onChannelActive(BufferResponseDecoder.java:54)
> 2021-11-23T00:58:03.8465948Z Nov 23 00:58:03  at 
> org.apache.flink.runtime.io.network.netty.NettyMessageClientDecoderDelegate.channelActive(NettyMessageClientDecoderDelegate.java:74)
> 2021-11-23T00:58:03.8467368Z Nov 23 00:58:03  at 
> org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannelHandlerContext.invokeChannelActive(AbstractChannelHandlerContext.java:230)
> 2021-11-23T00:58:03.8468324Z Nov 23 00:58:03  ... 14 more
> {code}
> https://dev.azure.com/apache-flink/apache-flink/_build/results?buildId=26873&view=logs&j=b0a398c0-685b-599c-eb57-c8c2a771138e&t=747432ad-a576-5911-1e2a-68c6bedc248a&l=10771



--
This message was sent by Atlassian Jira
(v8.20.1#820001)

Reply via email to