[
https://issues.apache.org/jira/browse/IGNITE-22123?page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel&focusedCommentId=17842851#comment-17842851
]
Roman Puchkovskiy commented on IGNITE-22123:
--------------------------------------------
Are full logs available? Without them, there is nothing that can be said, just
'something went wrong, probably the JVM is overloaded with GC'
> Critical thread blocked on 2 node cluster with intensive create tables
> ----------------------------------------------------------------------
>
> Key: IGNITE-22123
> URL: https://issues.apache.org/jira/browse/IGNITE-22123
> Project: Ignite
> Issue Type: Bug
> Affects Versions: 3.0
> Reporter: Alexander Belyak
> Priority: Major
> Labels: ignite-3
>
> # Start 2 nodes cluster (I use single host for both nodes)
> # Connect to the first node and do in cycle:
> ## create table (different 8 columns PK)
> ## insert a few rows in it
> ## select a row from table
> Expected result: test pass without errors
> Actual result:
> client get:
> {noformat}
> 16:45:20.253 [junit-timeout-thread-119] INFO
> o.g.a.t.teststeps.ThinClientSteps - Query: drop table if exists
> eight_different_types_TINYINT_INTEGER_FLOAT_TINYINT_TINYINT_TINYINT_TINYINT_TINYINT
> Apr 26, 2024 4:45:20 PM org.apache.ignite.internal.logger.IgniteLogger
> logInternal
> INFO: Partition assignment change notification received
> [remoteAddress=localhost:10800]
> 16:45:20.266 [junit-timeout-thread-119] INFO
> o.g.a.t.teststeps.ThinClientSteps - Query: create table
> eight_different_types_TINYINT_INTEGER_FLOAT_TINYINT_TINYINT_TINYINT_TINYINT_TINYINT(keyTINYINT0
> TINYINT not null, keyINTEGER1 INTEGER not null, keyFLOAT2 FLOAT not null,
> keyTINYINT3 TINYINT not null, keyTINYINT4 TINYINT not null, keyTINYINT5
> TINYINT not null, keyTINYINT6 TINYINT not null, keyTINYINT7 TINYINT not null,
> val INTEGER not null, primary key (keyTINYINT0, keyINTEGER1, keyFLOAT2,
> keyTINYINT3, keyTINYINT4, keyTINYINT5, keyTINYINT6, keyTINYINT7))
> 16:45:28.570 [junit-timeout-thread-119] INFO
> o.g.a.t.teststeps.ThinClientSteps - Query: insert into
> eight_different_types_TINYINT_INTEGER_FLOAT_TINYINT_TINYINT_TINYINT_TINYINT_TINYINT(keyTINYINT0,
> keyINTEGER1, keyFLOAT2, keyTINYINT3, keyTINYINT4, keyTINYINT5, keyTINYINT6,
> keyTINYINT7, val) values (-96, 25781810, 5.0, -93, -92, -91, -90, -89,
> 116513)org.apache.ignite.sql.SqlException: IGN-PLACEMENTDRIVER-1
> TraceId:e21f4eb1-4ecb-4ea2-aaf7-62a08b677f20 Failed to get the primary
> replica [tablePartitionId=85_part_18, awaitTimestamp=HybridTimestamp
> [physical=2024-04-26 16:45:28:599 +0300, logical=0,
> composite=112337821931864064]]
> at
> java.base/java.lang.invoke.MethodHandle.invokeWithArguments(MethodHandle.java:710)
> at
> org.apache.ignite.internal.util.ExceptionUtils$1.copy(ExceptionUtils.java:765)
> at
> org.apache.ignite.internal.util.ExceptionUtils$ExceptionFactory.createCopy(ExceptionUtils.java:699)
> at
> org.apache.ignite.internal.util.ExceptionUtils.copyExceptionWithCause(ExceptionUtils.java:525)
> at
> org.apache.ignite.internal.util.ExceptionUtils.copyExceptionWithCauseInternal(ExceptionUtils.java:634)
> at
> org.apache.ignite.internal.util.ExceptionUtils.copyExceptionWithCause(ExceptionUtils.java:476)
> at
> org.apache.ignite.internal.client.sql.ClientSql.execute(ClientSql.java:94)
> at
> org.gridgain.ai3tests.tests.teststeps.ThinClientSteps.lambda$executeQuery$0(ThinClientSteps.java:61)
> at io.qameta.allure.Allure.lambda$step$1(Allure.java:127)
> at io.qameta.allure.Allure.step(Allure.java:181)
> at io.qameta.allure.Allure.step(Allure.java:125)
> at
> org.gridgain.ai3tests.tests.teststeps.ThinClientSteps.executeQuery(ThinClientSteps.java:61)
> at
> org.gridgain.ai3tests.tests.PrimaryKeyConstraintsTest.testTypes(PrimaryKeyConstraintsTest.java:167)
> at
> org.gridgain.ai3tests.tests.PrimaryKeyConstraintsTest.test8Columns(PrimaryKeyConstraintsTest.java:120)
> at java.base/java.lang.reflect.Method.invoke(Method.java:566)
> at
> io.qameta.allure.junit5.AllureJunit5.interceptTestTemplateMethod(AllureJunit5.java:59)
> at java.base/java.util.concurrent.FutureTask.run(FutureTask.java:264)
> at
> java.base/java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1128)
> at
> java.base/java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:628)
> at java.base/java.lang.Thread.run(Thread.java:829)
> Caused by: java.util.concurrent.CompletionException:
> org.apache.ignite.sql.SqlException: IGN-PLACEMENTDRIVER-1
> TraceId:e21f4eb1-4ecb-4ea2-aaf7-62a08b677f20 Failed to get the primary
> replica [tablePartitionId=85_part_18, awaitTimestamp=HybridTimestamp
> [physical=2024-04-26 16:45:28:599 +0300, logical=0,
> composite=112337821931864064]]
> at
> java.base/java.util.concurrent.CompletableFuture.encodeThrowable(CompletableFuture.java:331)
> at
> java.base/java.util.concurrent.CompletableFuture.completeThrowable(CompletableFuture.java:346)
> at
> java.base/java.util.concurrent.CompletableFuture.uniWhenComplete(CompletableFuture.java:870)
> at
> java.base/java.util.concurrent.CompletableFuture$UniWhenComplete.tryFire(CompletableFuture.java:837)
> at
> java.base/java.util.concurrent.CompletableFuture.postComplete(CompletableFuture.java:506)
> at
> java.base/java.util.concurrent.CompletableFuture.completeExceptionally(CompletableFuture.java:2094)
> at
> org.apache.ignite.internal.client.TcpClientChannel.processNextMessage(TcpClientChannel.java:419)
> at
> org.apache.ignite.internal.client.TcpClientChannel.lambda$onMessage$3(TcpClientChannel.java:238)
> at
> java.base/java.util.concurrent.ForkJoinTask$RunnableExecuteAction.exec(ForkJoinTask.java:1426)
> at
> java.base/java.util.concurrent.ForkJoinTask.doExec(ForkJoinTask.java:290)
> at
> java.base/java.util.concurrent.ForkJoinPool$WorkQueue.topLevelExec(ForkJoinPool.java:1020)
> at
> java.base/java.util.concurrent.ForkJoinPool.scan(ForkJoinPool.java:1656)
> at
> java.base/java.util.concurrent.ForkJoinPool.runWorker(ForkJoinPool.java:1594)
> at
> java.base/java.util.concurrent.ForkJoinWorkerThread.run(ForkJoinWorkerThread.java:183)
> Caused by: org.apache.ignite.sql.SqlException: IGN-PLACEMENTDRIVER-1
> TraceId:e21f4eb1-4ecb-4ea2-aaf7-62a08b677f20 Failed to get the primary
> replica [tablePartitionId=85_part_18, awaitTimestamp=HybridTimestamp
> [physical=2024-04-26 16:45:28:599 +0300, logical=0,
> composite=112337821931864064]]
> at
> java.base/java.lang.invoke.MethodHandle.invokeWithArguments(MethodHandle.java:710)
> at
> org.apache.ignite.internal.util.ExceptionUtils$1.copy(ExceptionUtils.java:765)
> at
> org.apache.ignite.internal.util.ExceptionUtils$ExceptionFactory.createCopy(ExceptionUtils.java:699)
> at
> org.apache.ignite.internal.util.ExceptionUtils.copyExceptionWithCause(ExceptionUtils.java:525)
> at
> org.apache.ignite.internal.client.TcpClientChannel.readError(TcpClientChannel.java:508)
> at
> org.apache.ignite.internal.client.TcpClientChannel.processNextMessage(TcpClientChannel.java:397)
> ... 7 more{noformat}
>
> in a server logs:
> {noformat}
> 2024-04-26 16:46:42:196 +0300
> [ERROR][%PrimaryKeyConstraintsTest_cluster_0%common-scheduler-0][CriticalWorkerWatchdog]
> A critical thread is blocked for 580 ms that is more than the allowed 500
> ms, it is "PrimaryKeyConstraintsTest_cluster_0-srv-worker-15" prio=10 Id=49
> RUNNABLE
> at [email protected]/sun.nio.ch.FileDispatcherImpl.write0(Native Method)
> at
> [email protected]/sun.nio.ch.SocketDispatcher.write(SocketDispatcher.java:62)
> at
> [email protected]/sun.nio.ch.IOUtil.writeFromNativeBuffer(IOUtil.java:137)
> at [email protected]/sun.nio.ch.IOUtil.write(IOUtil.java:81)
> at [email protected]/sun.nio.ch.IOUtil.write(IOUtil.java:58)
> at
> [email protected]/sun.nio.ch.SocketChannelImpl.write(SocketChannelImpl.java:532)
> at
> app//io.netty.channel.socket.nio.NioSocketChannel.doWrite(NioSocketChannel.java:415)
> at
> app//io.netty.channel.AbstractChannel$AbstractUnsafe.flush0(AbstractChannel.java:931)
> at
> app//io.netty.channel.nio.AbstractNioChannel$AbstractNioUnsafe.flush0(AbstractNioChannel.java:359)
> at
> app//io.netty.channel.AbstractChannel$AbstractUnsafe.flush(AbstractChannel.java:895)
> at
> app//io.netty.channel.DefaultChannelPipeline$HeadContext.flush(DefaultChannelPipeline.java:1372)
> at
> app//io.netty.channel.AbstractChannelHandlerContext.invokeFlush0(AbstractChannelHandlerContext.java:935)
> at
> app//io.netty.channel.AbstractChannelHandlerContext.invokeWriteAndFlush(AbstractChannelHandlerContext.java:957)
> at
> app//io.netty.channel.AbstractChannelHandlerContext.write(AbstractChannelHandlerContext.java:982)
> at
> app//io.netty.channel.AbstractChannelHandlerContext.writeAndFlush(AbstractChannelHandlerContext.java:950)
> at
> app//io.netty.channel.AbstractChannelHandlerContext.writeAndFlush(AbstractChannelHandlerContext.java:1000)
> at
> app//io.netty.handler.stream.ChunkedWriteHandler.doFlush(ChunkedWriteHandler.java:286)
> at
> app//io.netty.handler.stream.ChunkedWriteHandler.flush(ChunkedWriteHandler.java:146)
> at
> app//io.netty.channel.AbstractChannelHandlerContext.invokeFlush0(AbstractChannelHandlerContext.java:937)
> at
> app//io.netty.channel.AbstractChannelHandlerContext.invokeFlush(AbstractChannelHandlerContext.java:921)
> at
> app//io.netty.channel.AbstractChannelHandlerContext.flush(AbstractChannelHandlerContext.java:907)
> at
> app//io.netty.channel.ChannelOutboundHandlerAdapter.flush(ChannelOutboundHandlerAdapter.java:125)
> at
> app//io.netty.channel.AbstractChannelHandlerContext.invokeFlush0(AbstractChannelHandlerContext.java:939)
> at
> app//io.netty.channel.AbstractChannelHandlerContext.invokeWriteAndFlush(AbstractChannelHandlerContext.java:957)
> at
> app//io.netty.channel.AbstractChannelHandlerContext.write(AbstractChannelHandlerContext.java:982)
> at
> app//io.netty.channel.AbstractChannelHandlerContext.writeAndFlush(AbstractChannelHandlerContext.java:950)
> at
> app//io.netty.channel.AbstractChannelHandlerContext.writeAndFlush(AbstractChannelHandlerContext.java:1000)
> at
> app//io.netty.channel.DefaultChannelPipeline.writeAndFlush(DefaultChannelPipeline.java:1025)
> at
> app//io.netty.channel.AbstractChannel.writeAndFlush(AbstractChannel.java:306)
> at
> app//org.apache.ignite.internal.network.netty.NettySender.writeWithRecovery(NettySender.java:173)
> at
> app//org.apache.ignite.internal.network.netty.NettySender.lambda$send$1(NettySender.java:113)
> at
> app//org.apache.ignite.internal.network.netty.NettySender$$Lambda$1226/0x000000080135b9d8.run(Unknown
> Source)
> at
> app//io.netty.util.concurrent.AbstractEventExecutor.runTask(AbstractEventExecutor.java:173)
> at
> app//io.netty.util.concurrent.AbstractEventExecutor.safeExecute(AbstractEventExecutor.java:166)
> at
> app//io.netty.util.concurrent.SingleThreadEventExecutor.runAllTasks(SingleThreadEventExecutor.java:470)
> at app//io.netty.channel.nio.NioEventLoop.run(NioEventLoop.java:569)
> at
> app//io.netty.util.concurrent.SingleThreadEventExecutor$4.run(SingleThreadEventExecutor.java:997)
> at
> app//io.netty.util.internal.ThreadExecutorMap$2.run(ThreadExecutorMap.java:74)
> at
> app//io.netty.util.concurrent.FastThreadLocalRunnable.run(FastThreadLocalRunnable.java:30)
> at [email protected]/java.lang.Thread.run(Thread.java:833) Number of
> locked synchronizers = 1
> - java.util.concurrent.locks.ReentrantLock$NonfairSync@3d96d0f5
> {noformat}
--
This message was sent by Atlassian Jira
(v8.20.10#820010)