skorotkov commented on code in PR #10178: URL: https://github.com/apache/ignite/pull/10178#discussion_r941987042
########## modules/core/src/test/java/org/apache/ignite/internal/processors/cache/transactions/TxRecoveryConcurrentOnPrimaryFailTest.java: ########## @@ -0,0 +1,171 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one or more + * contributor license agreements. See the NOTICE file distributed with + * this work for additional information regarding copyright ownership. + * The ASF licenses this file to You under the Apache License, Version 2.0 + * (the "License"); you may not use this file except in compliance with + * the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.ignite.internal.processors.cache.transactions; + +import java.util.Collection; +import java.util.concurrent.BrokenBarrierException; +import java.util.concurrent.CyclicBarrier; +import org.apache.ignite.IgniteCache; +import org.apache.ignite.cache.affinity.rendezvous.RendezvousAffinityFunction; +import org.apache.ignite.configuration.CacheConfiguration; +import org.apache.ignite.configuration.IgniteConfiguration; +import org.apache.ignite.failure.StopNodeFailureHandler; +import org.apache.ignite.internal.IgniteEx; +import org.apache.ignite.internal.TestRecordingCommunicationSpi; +import org.apache.ignite.internal.processors.cache.distributed.dht.GridDhtTxFinishRequest; +import org.apache.ignite.testframework.GridTestUtils; +import org.apache.ignite.testframework.junits.common.GridCommonAbstractTest; +import org.apache.ignite.transactions.Transaction; +import org.junit.Test; + +import static org.apache.ignite.cache.CacheAtomicityMode.TRANSACTIONAL; +import static 
org.apache.ignite.cache.CacheMode.PARTITIONED; +import static org.apache.ignite.internal.TestRecordingCommunicationSpi.spi; +import static org.apache.ignite.testframework.GridTestUtils.runAsync; +import static org.apache.ignite.transactions.TransactionConcurrency.PESSIMISTIC; +import static org.apache.ignite.transactions.TransactionIsolation.REPEATABLE_READ; + +/** + * Tests concurrent execution of the tx recovery. + */ +public class TxRecoveryConcurrentOnPrimaryFailTest extends GridCommonAbstractTest { + /** {@inheritDoc} */ + @Override protected IgniteConfiguration getConfiguration(String name) throws Exception { + final IgniteConfiguration cfg = super.getConfiguration(name); + + cfg.setConsistentId(name); + + cfg.setCommunicationSpi(new TestRecordingCommunicationSpi()); + + cfg.setFailureHandler(new StopNodeFailureHandler()); + + cfg.setSystemThreadPoolSize(1); + + cfg.setStripedPoolSize(1); + + cfg.setCacheConfiguration(new CacheConfiguration<>(DEFAULT_CACHE_NAME).setCacheMode(PARTITIONED) + .setBackups(2).setAtomicityMode(TRANSACTIONAL).setAffinity(new RendezvousAffinityFunction(false, 1))); + + return cfg; + } + + /** {@inheritDoc} */ + @Override protected void afterTest() throws Exception { + super.afterTest(); + + stopAllGrids(); + } + + /** + * The test enforces the concurrent processing of the same prepared transaction + * both in the tx recovery procedure started because the primary node left and in the + * tx recovery request handler invoked by a message from another backup node. + * <p> + * The idea is to have a 3-node cluster and a cache with 2 backups. So there + * will be 2 backup nodes to execute the tx recovery in parallel if the primary one + * fails. These backup nodes will send the tx recovery requests to each + * other, so the tx recovery request handler will be invoked as well. + * <p> + * Use several attempts to reproduce the race condition. 
+ * <p> + * Expected result: transaction is finished on both backup nodes and the partition + * map exchange is completed as well. + */ + @Test + public void testRecoveryNotDeadLockOnPrimaryFail() throws Exception { + final IgniteEx grid0 = startGrid(0); + + final IgniteEx grid1 = startGrid(1); + + final CyclicBarrier grid1BlockerBarrier = new CyclicBarrier(3); + + final Runnable grid1BlockerTask = () -> { + try { + grid1BlockerBarrier.await(); + } + catch (InterruptedException | BrokenBarrierException e) { + // Just suppress. + } + }; + + for (int iter = 0; iter < 100; iter++) { + final IgniteEx grid2 = startGrid(2); + + awaitPartitionMapExchange(); + + final IgniteCache<Object, Object> cache = grid2.cache(DEFAULT_CACHE_NAME); + + final Transaction tx = grid2.transactions().txStart(PESSIMISTIC, REPEATABLE_READ); + + // Key for which the grid2 node is primary. + final Integer grid2PrimaryKey = primaryKeys(cache, 1, 0).get(0); + + cache.put(grid2PrimaryKey, Boolean.TRUE); Review Comment: ok -- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. To unsubscribe, e-mail: [email protected] For queries about this service, please contact Infrastructure at: [email protected]
