[ 
https://issues.apache.org/jira/browse/FLINK-18148?page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel&focusedCommentId=17126479#comment-17126479
 ] 

Robert Metzger commented on FLINK-18148:
----------------------------------------

{code}
2020-06-04T20:45:26.8965495Z 2020-06-04 20:43:17,927 WARN  
org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannel [] - 
Force-closing a channel whose registration task was not accepted by an event 
loop: [id: 0x19b77503]
2020-06-04T20:45:26.8966167Z java.util.concurrent.RejectedExecutionException: 
event executor terminated
2020-06-04T20:45:26.8967054Z    at 
org.apache.flink.shaded.netty4.io.netty.util.concurrent.SingleThreadEventExecutor.reject(SingleThreadEventExecutor.java:855)
 ~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.8968164Z    at 
org.apache.flink.shaded.netty4.io.netty.util.concurrent.SingleThreadEventExecutor.offerTask(SingleThreadEventExecutor.java:340)
 ~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.8969809Z    at 
org.apache.flink.shaded.netty4.io.netty.util.concurrent.SingleThreadEventExecutor.addTask(SingleThreadEventExecutor.java:333)
 ~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.8971146Z    at 
org.apache.flink.shaded.netty4.io.netty.util.concurrent.SingleThreadEventExecutor.execute(SingleThreadEventExecutor.java:766)
 ~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.8972368Z    at 
org.apache.flink.shaded.netty4.io.netty.channel.AbstractChannel$AbstractUnsafe.register(AbstractChannel.java:472)
 ~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.8980429Z    at 
org.apache.flink.shaded.netty4.io.netty.channel.SingleThreadEventLoop.register(SingleThreadEventLoop.java:87)
 ~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.8981747Z    at 
org.apache.flink.shaded.netty4.io.netty.channel.SingleThreadEventLoop.register(SingleThreadEventLoop.java:81)
 ~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.8982893Z    at 
org.apache.flink.shaded.netty4.io.netty.channel.MultithreadEventLoopGroup.register(MultithreadEventLoopGroup.java:86)
 ~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.8987906Z    at 
org.apache.flink.shaded.netty4.io.netty.bootstrap.AbstractBootstrap.initAndRegister(AbstractBootstrap.java:322)
 ~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.8989457Z    at 
org.apache.flink.shaded.netty4.io.netty.bootstrap.Bootstrap.doResolveAndConnect(Bootstrap.java:159)
 ~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.8990418Z    at 
org.apache.flink.shaded.netty4.io.netty.bootstrap.Bootstrap.connect(Bootstrap.java:143)
 ~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.8991327Z    at 
org.apache.flink.shaded.netty4.io.netty.bootstrap.Bootstrap.connect(Bootstrap.java:127)
 ~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.8992214Z    at 
org.apache.flink.runtime.rest.RestClient.submitRequest(RestClient.java:333) 
~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.8993075Z    at 
org.apache.flink.runtime.rest.RestClient.sendRequest(RestClient.java:272) 
~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.8994034Z    at 
org.apache.flink.runtime.rest.RestClient.sendRequest(RestClient.java:214) 
~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.8994967Z    at 
org.apache.flink.client.program.rest.RestClusterClient.lambda$null$23(RestClusterClient.java:666)
 ~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.8995554Z    at 
java.util.concurrent.CompletableFuture.uniCompose(CompletableFuture.java:966) 
[?:1.8.0_252]
2020-06-04T20:45:26.8996060Z    at 
java.util.concurrent.CompletableFuture$UniCompose.tryFire(CompletableFuture.java:940)
 [?:1.8.0_252]
2020-06-04T20:45:26.9000099Z    at 
java.util.concurrent.CompletableFuture.postComplete(CompletableFuture.java:488) 
[?:1.8.0_252]
2020-06-04T20:45:26.9000612Z    at 
java.util.concurrent.CompletableFuture.postFire(CompletableFuture.java:575) 
[?:1.8.0_252]
2020-06-04T20:45:26.9001111Z    at 
java.util.concurrent.CompletableFuture$UniApply.tryFire(CompletableFuture.java:594)
 [?:1.8.0_252]
2020-06-04T20:45:26.9001612Z    at 
java.util.concurrent.CompletableFuture$Completion.run(CompletableFuture.java:456)
 [?:1.8.0_252]
2020-06-04T20:45:26.9002114Z    at 
java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149) 
[?:1.8.0_252]
2020-06-04T20:45:26.9002610Z    at 
java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624) 
[?:1.8.0_252]
2020-06-04T20:45:26.9003010Z    at java.lang.Thread.run(Thread.java:748) 
[?:1.8.0_252]
2020-06-04T20:45:26.9003944Z 2020-06-04 20:43:17,933 ERROR 
org.apache.flink.shaded.netty4.io.netty.util.concurrent.DefaultPromise.rejectedExecution
 [] - Failed to submit a listener notification task. Event loop shut down?
2020-06-04T20:45:26.9004509Z java.util.concurrent.RejectedExecutionException: 
event executor terminated
2020-06-04T20:45:26.9005413Z    at 
org.apache.flink.shaded.netty4.io.netty.util.concurrent.SingleThreadEventExecutor.reject(SingleThreadEventExecutor.java:855)
 ~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.9006648Z    at 
org.apache.flink.shaded.netty4.io.netty.util.concurrent.SingleThreadEventExecutor.offerTask(SingleThreadEventExecutor.java:340)
 ~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.9007807Z    at 
org.apache.flink.shaded.netty4.io.netty.util.concurrent.SingleThreadEventExecutor.addTask(SingleThreadEventExecutor.java:333)
 ~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.9008903Z    at 
org.apache.flink.shaded.netty4.io.netty.util.concurrent.SingleThreadEventExecutor.execute(SingleThreadEventExecutor.java:766)
 ~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.9013958Z    at 
org.apache.flink.shaded.netty4.io.netty.util.concurrent.DefaultPromise.safeExecute(DefaultPromise.java:764)
 ~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.9015352Z    at 
org.apache.flink.shaded.netty4.io.netty.util.concurrent.DefaultPromise.notifyListeners(DefaultPromise.java:421)
 ~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.9016498Z    at 
org.apache.flink.shaded.netty4.io.netty.util.concurrent.DefaultPromise.addListener(DefaultPromise.java:149)
 ~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.9017611Z    at 
org.apache.flink.shaded.netty4.io.netty.channel.DefaultChannelPromise.addListener(DefaultChannelPromise.java:95)
 ~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.9022680Z    at 
org.apache.flink.shaded.netty4.io.netty.channel.DefaultChannelPromise.addListener(DefaultChannelPromise.java:30)
 ~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.9023773Z    at 
org.apache.flink.runtime.rest.RestClient.submitRequest(RestClient.java:337) 
~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.9024636Z    at 
org.apache.flink.runtime.rest.RestClient.sendRequest(RestClient.java:272) 
~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.9025475Z    at 
org.apache.flink.runtime.rest.RestClient.sendRequest(RestClient.java:214) 
~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.9027095Z    at 
org.apache.flink.client.program.rest.RestClusterClient.lambda$null$23(RestClusterClient.java:666)
 ~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.9027708Z    at 
java.util.concurrent.CompletableFuture.uniCompose(CompletableFuture.java:966) 
[?:1.8.0_252]
2020-06-04T20:45:26.9028213Z    at 
java.util.concurrent.CompletableFuture$UniCompose.tryFire(CompletableFuture.java:940)
 [?:1.8.0_252]
2020-06-04T20:45:26.9028722Z    at 
java.util.concurrent.CompletableFuture.postComplete(CompletableFuture.java:488) 
[?:1.8.0_252]
2020-06-04T20:45:26.9029378Z    at 
java.util.concurrent.CompletableFuture.postFire(CompletableFuture.java:575) 
[?:1.8.0_252]
2020-06-04T20:45:26.9033740Z    at 
java.util.concurrent.CompletableFuture$UniApply.tryFire(CompletableFuture.java:594)
 [?:1.8.0_252]
2020-06-04T20:45:26.9034425Z    at 
java.util.concurrent.CompletableFuture$Completion.run(CompletableFuture.java:456)
 [?:1.8.0_252]
2020-06-04T20:45:26.9034968Z    at 
java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149) 
[?:1.8.0_252]
2020-06-04T20:45:26.9035508Z    at 
java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624) 
[?:1.8.0_252]
2020-06-04T20:45:26.9035945Z    at java.lang.Thread.run(Thread.java:748) 
[?:1.8.0_252]
2020-06-04T20:45:26.9036840Z 2020-06-04 20:43:17,934 ERROR 
org.apache.flink.client.cli.CliFrontend                      [] - Error while 
running the command.
2020-06-04T20:45:26.9037389Z org.apache.flink.util.FlinkException: Could not 
stop with a savepoint job "44312127344716c7caf340918231aeaa".
2020-06-04T20:45:26.9038264Z    at 
org.apache.flink.client.cli.CliFrontend.lambda$stop$5(CliFrontend.java:495) 
~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.9043465Z    at 
org.apache.flink.client.cli.CliFrontend.runClusterAction(CliFrontend.java:864) 
~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.9044395Z    at 
org.apache.flink.client.cli.CliFrontend.stop(CliFrontend.java:487) 
~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.9045470Z    at 
org.apache.flink.client.cli.CliFrontend.parseParameters(CliFrontend.java:931) 
~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.9046472Z    at 
org.apache.flink.client.cli.CliFrontend.lambda$main$10(CliFrontend.java:992) 
~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.9047493Z    at 
org.apache.flink.runtime.security.contexts.NoOpSecurityContext.runSecured(NoOpSecurityContext.java:30)
 [flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.9048451Z    at 
org.apache.flink.client.cli.CliFrontend.main(CliFrontend.java:992) 
[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.9048920Z Caused by: java.util.concurrent.TimeoutException
2020-06-04T20:45:26.9049343Z    at 
java.util.concurrent.CompletableFuture.timedGet(CompletableFuture.java:1784) 
~[?:1.8.0_252]
2020-06-04T20:45:26.9049846Z    at 
java.util.concurrent.CompletableFuture.get(CompletableFuture.java:1928) 
~[?:1.8.0_252]
2020-06-04T20:45:26.9054664Z    at 
org.apache.flink.client.cli.CliFrontend.lambda$stop$5(CliFrontend.java:493) 
~[flink-dist_2.11-1.11-SNAPSHOT.jar:1.11-SNAPSHOT]
2020-06-04T20:45:26.9055247Z    ... 6 more
{code}
https://dev.azure.com/apache-flink/apache-flink/_build/results?buildId=2759&view=logs&j=91bf6583-3fb2-592f-e4d4-d79d79c3230a&t=94459a52-42b6-5bfc-5d74-690b5d3c6de8

> "Resuming Savepoint" e2e fails with TimeoutException in CliFrontend.stop() 
> ---------------------------------------------------------------------------
>
>                 Key: FLINK-18148
>                 URL: https://issues.apache.org/jira/browse/FLINK-18148
>             Project: Flink
>          Issue Type: Bug
>          Components: Command Line Client
>    Affects Versions: 1.11.0
>            Reporter: Robert Metzger
>            Priority: Major
>              Labels: test-stability
>
> https://dev.azure.com/apache-flink/apache-flink/_build/results?buildId=2759&view=logs&j=c88eea3b-64a0-564d-0031-9fdcd7b8abee&t=1e2bbe5b-4657-50be-1f07-d84bfce5b1f5
> {code}
> ------------------------------------------------------------
>  The program finished with the following exception:
> org.apache.flink.util.FlinkException: Could not stop with a savepoint job 
> "081bda854bc250e01055ed1ba9d43178".
>       at 
> org.apache.flink.client.cli.CliFrontend.lambda$stop$5(CliFrontend.java:495)
>       at 
> org.apache.flink.client.cli.CliFrontend.runClusterAction(CliFrontend.java:864)
>       at org.apache.flink.client.cli.CliFrontend.stop(CliFrontend.java:487)
>       at 
> org.apache.flink.client.cli.CliFrontend.parseParameters(CliFrontend.java:931)
>       at 
> org.apache.flink.client.cli.CliFrontend.lambda$main$10(CliFrontend.java:992)
>       at 
> org.apache.flink.runtime.security.contexts.NoOpSecurityContext.runSecured(NoOpSecurityContext.java:30)
>       at org.apache.flink.client.cli.CliFrontend.main(CliFrontend.java:992)
> Caused by: java.util.concurrent.TimeoutException
>       at 
> java.util.concurrent.CompletableFuture.timedGet(CompletableFuture.java:1784)
>       at 
> java.util.concurrent.CompletableFuture.get(CompletableFuture.java:1928)
>       at 
> org.apache.flink.client.cli.CliFrontend.lambda$stop$5(CliFrontend.java:493)
>       ... 6 more
> Waiting for job (081bda854bc250e01055ed1ba9d43178) to reach terminal state 
> FINISHED ...
> Job (081bda854bc250e01055ed1ba9d43178) reached terminal state FINISHED
> Savepoint location was empty. This may mean that the stop-with-savepoint 
> failed.
> [FAIL] Test script contains errors.
> {code}



--
This message was sent by Atlassian Jira
(v8.3.4#803005)

Reply via email to