| /* |
| * Licensed to the Apache Software Foundation (ASF) under one or more |
| * contributor license agreements. See the NOTICE file distributed with |
| * this work for additional information regarding copyright ownership. |
| * The ASF licenses this file to You under the Apache License, Version 2.0 |
| * (the "License"); you may not use this file except in compliance with |
| * the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| package org.apache.ignite.internal.processors.cache.distributed; |
| |
| import java.util.ArrayList; |
| import java.util.Collection; |
| import java.util.Collections; |
| import java.util.HashMap; |
| import java.util.HashSet; |
| import java.util.Map; |
| import java.util.Optional; |
| import java.util.Set; |
| import java.util.UUID; |
| import java.util.concurrent.Callable; |
| import java.util.concurrent.TimeUnit; |
| import java.util.stream.StreamSupport; |
| import org.apache.ignite.Ignite; |
| import org.apache.ignite.IgniteCache; |
| import org.apache.ignite.IgniteException; |
| import org.apache.ignite.Ignition; |
| import org.apache.ignite.cache.CacheMode; |
| import org.apache.ignite.cluster.ClusterNode; |
| import org.apache.ignite.configuration.CacheConfiguration; |
| import org.apache.ignite.configuration.IgniteConfiguration; |
| import org.apache.ignite.internal.IgniteEx; |
| import org.apache.ignite.internal.IgniteKernal; |
| import org.apache.ignite.internal.managers.communication.GridIoMessage; |
| import org.apache.ignite.internal.processors.cache.GridCacheAbstractSelfTest; |
| import org.apache.ignite.internal.processors.cache.GridCacheAdapter; |
| import org.apache.ignite.internal.processors.cache.GridCacheContext; |
| import org.apache.ignite.internal.processors.cache.IgniteCacheOffheapManager; |
| import org.apache.ignite.internal.processors.cache.distributed.near.GridNearCacheAdapter; |
| import org.apache.ignite.internal.processors.cache.distributed.near.GridNearTxLocal; |
| import org.apache.ignite.internal.processors.cache.transactions.IgniteTxManager; |
| import org.apache.ignite.internal.processors.cache.transactions.TransactionProxyImpl; |
| import org.apache.ignite.internal.util.lang.GridAbsPredicate; |
| import org.apache.ignite.internal.util.typedef.F; |
| import org.apache.ignite.internal.util.typedef.G; |
| import org.apache.ignite.lang.IgniteCallable; |
| import org.apache.ignite.lang.IgniteFuture; |
| import org.apache.ignite.lang.IgniteFutureTimeoutException; |
| import org.apache.ignite.lang.IgniteInClosure; |
| import org.apache.ignite.plugin.extensions.communication.Message; |
| import org.apache.ignite.resources.IgniteInstanceResource; |
| import org.apache.ignite.spi.IgniteSpiException; |
| import org.apache.ignite.spi.communication.tcp.TcpCommunicationSpi; |
| import org.apache.ignite.testframework.GridTestUtils; |
| import org.apache.ignite.transactions.Transaction; |
| import org.junit.Test; |
| |
| import static org.apache.ignite.cache.CacheAtomicityMode.TRANSACTIONAL_SNAPSHOT; |
| import static org.apache.ignite.transactions.TransactionConcurrency.PESSIMISTIC; |
| |
| /** |
| * Abstract test for pessimistic transaction recovery when the originating or primary node fails. |
| */ |
| public abstract class IgniteTxPessimisticOriginatingNodeFailureAbstractSelfTest extends GridCacheAbstractSelfTest { |
| /** Default number of grid nodes, see {@link #gridCount()}. */ |
| protected static final int GRID_CNT = 5; |
| |
| /** IDs of destination nodes for which matching messages are dropped; {@code null} disables dropping. */ |
| private volatile Collection<UUID> ignoreMsgNodeIds; |
| |
| /** |
| * Message classes to drop. Volatile because the field is written by the test thread and read inside |
| * the communication SPI's {@code sendMessage()}, which may be invoked from other threads. |
| */ |
| private volatile Collection<Class<?>> ignoreMsgCls; |
| |
| /** ID of the node whose outgoing messages are filtered. Volatile for the same reason as the fields above. */ |
| private volatile UUID failingNodeId; |
| |
| /** |
| * Runs the originating node failure scenario over 200 keys without dropping any messages. |
| * |
| * @throws Exception If failed. |
| */ |
| @Test |
| public void testManyKeysCommit() throws Exception { |
| final int keyCnt = 200; |
| |
| Collection<Integer> keys = new ArrayList<>(keyCnt); |
| |
| for (int key = 0; key < keyCnt; key++) |
| keys.add(key); |
| |
| testTxOriginatingNodeFails(keys, false); |
| } |
| |
| /** |
| * Runs the originating node failure scenario over 200 keys with the full failure flag set, i.e. with |
| * the configured message classes being dropped. |
| * |
| * @throws Exception If failed. |
| */ |
| @Test |
| public void testManyKeysRollback() throws Exception { |
| final int keyCnt = 200; |
| |
| Collection<Integer> keys = new ArrayList<>(keyCnt); |
| |
| for (int key = 0; key < keyCnt; key++) |
| keys.add(key); |
| |
| testTxOriginatingNodeFails(keys, true); |
| } |
| |
| /** |
| * Checks data consistency when the primary node is stopped after the transaction has been prepared |
| * and the transaction is then committed. |
| * |
| * @throws Exception If failed. |
| */ |
| @Test |
| public void testPrimaryNodeFailureCommit() throws Exception { |
| checkPrimaryNodeCrash(true); |
| } |
| |
| /** |
| * Checks data consistency when the primary node is stopped in the middle of a transaction |
| * and the transaction is then rolled back. |
| * |
| * @throws Exception If failed. |
| */ |
| @Test |
| public void testPrimaryNodeFailureRollback() throws Exception { |
| checkPrimaryNodeCrash(false); |
| } |
| |
| /** |
| * Subclasses may override this method to start the transaction from a different node. |
| * |
| * @return Index of node starting transaction. |
| */ |
| protected int originatingNode() { |
| return 0; |
| } |
| |
| /** |
| * Configures which messages sent by the failing node are dropped: messages of any of the given classes |
| * that are addressed to any of the given nodes. |
| * |
| * @param msgCls Message classes to drop. |
| * @param dstNodeIds Destination node IDs. |
| */ |
| protected void ignoreMessages(Collection<Class<?>> msgCls, Collection<UUID> dstNodeIds) { |
| ignoreMsgNodeIds = dstNodeIds; |
| ignoreMsgCls = msgCls; |
| } |
| |
| /** |
| * Gets the message classes that are dropped on the originating node when a full failure is simulated |
| * in {@link #testTxOriginatingNodeFails(Collection, boolean)}. |
| * |
| * @return Message classes to ignore. |
| */ |
| protected abstract Collection<Class<?>> ignoreMessageClasses(); |
| |
| /** |
| * Starts a pessimistic transaction on the originating node, stops that node after the commit has been |
| * initiated and verifies that the remaining nodes finish the transaction and hold consistent data. |
| * <p> |
| * When {@code fullFailure} is set, messages of the classes returned by {@link #ignoreMessageClasses()} |
| * sent by the originating node to the checked node are dropped and the initial values are expected |
| * afterwards; otherwise the values written by the transaction are expected. |
| * |
| * @param keys Keys to update. |
| * @param fullFailure Flag indicating whether to simulate rollback state. |
| * @throws Exception If failed. |
| */ |
| protected void testTxOriginatingNodeFails(Collection<Integer> keys, final boolean fullFailure) throws Exception { |
| assertFalse(keys.isEmpty()); |
| |
| final int origIdx = originatingNode(); |
| |
| // Any surviving node can serve for affinity look-ups and as the target of dropped messages. |
| final int checkIdx = origIdx == 1 ? 0 : 1; |
| |
| final IgniteEx originatingNodeGrid = grid(origIdx); |
| |
| ClusterNode txNode = originatingNodeGrid.localNode(); |
| |
| final Collection<IgniteKernal> grids = new ArrayList<>(); |
| |
| // Collect every node except the one that is going to be stopped. |
| for (int i = 0; i < gridCount(); i++) { |
| if (i != origIdx) |
| grids.add((IgniteKernal)grid(i)); |
| } |
| |
| // Message filtering has to be applied on the node that starts the transaction. |
| failingNodeId = txNode.id(); |
| |
| final Map<Integer, String> map = new HashMap<>(); |
| |
| final String initVal = "initialValue"; |
| |
| for (Integer key : keys) { |
| originatingNodeGrid.cache(DEFAULT_CACHE_NAME).put(key, initVal); |
| |
| map.put(key, String.valueOf(key)); |
| } |
| |
| // Nodes (other than the originating one) that own each key and therefore must be verified. |
| Map<Integer, Collection<ClusterNode>> nodeMap = new HashMap<>(); |
| |
| info("Node being checked: " + grid(checkIdx).localNode().id()); |
| |
| for (Integer key : keys) { |
| Collection<ClusterNode> nodes = new ArrayList<>(); |
| |
| nodes.addAll(grid(checkIdx).affinity(DEFAULT_CACHE_NAME).mapKeyToPrimaryAndBackups(key)); |
| |
| nodes.remove(txNode); |
| |
| nodeMap.put(key, nodes); |
| } |
| |
| info("Starting tx [values=" + map + ", topVer=" + |
| ((IgniteKernal)grid(checkIdx)).context().discovery().topologyVersion() + ']'); |
| |
| if (fullFailure) |
| ignoreMessages(ignoreMessageClasses(), F.asList(grid(checkIdx).localNode().id())); |
| |
| GridTestUtils.runAsync(new Callable<Void>() { |
| @Override public Void call() throws Exception { |
| IgniteCache<Integer, String> cache = originatingNodeGrid.cache(DEFAULT_CACHE_NAME); |
| |
| assertNotNull(cache); |
| |
| // The transaction is intentionally left open: the node is stopped while it is in progress. |
| Transaction tx = originatingNodeGrid.transactions().txStart(); |
| |
| assertEquals(PESSIMISTIC, tx.concurrency()); |
| |
| try { |
| cache.putAll(map); |
| |
| info("Before commitAsync"); |
| |
| IgniteFuture<?> fut = tx.commitAsync(); |
| |
| info("Got future for commitAsync()."); |
| |
| fut.get(3, TimeUnit.SECONDS); |
| } |
| catch (IgniteFutureTimeoutException ignored) { |
| // A timeout is tolerated here: dropped messages may prevent the commit from completing. |
| info("Failed to wait for commit future completion [fullFailure=" + fullFailure + ']'); |
| } |
| |
| return null; |
| } |
| }).get(); |
| |
| info(">>> Stopping originating node " + txNode); |
| |
| G.stop(originatingNodeGrid.name(), true); |
| |
| ignoreMessages(Collections.<Class<?>>emptyList(), Collections.<UUID>emptyList()); |
| |
| info(">>> Stopped originating node: " + txNode.id()); |
| |
| // Wait until no transactions are registered on any of the surviving nodes. |
| boolean txFinished = GridTestUtils.waitForCondition(new GridAbsPredicate() { |
| @Override public boolean apply() { |
| for (IgniteKernal g : grids) { |
| GridCacheAdapter<?, ?> cache = g.internalCache(DEFAULT_CACHE_NAME); |
| |
| IgniteTxManager txMgr = cache.isNear() ? |
| ((GridNearCacheAdapter)cache).dht().context().tm() : |
| cache.context().tm(); |
| |
| int txNum = txMgr.idMapSize(); |
| |
| if (txNum != 0) |
| return false; |
| } |
| |
| return true; |
| } |
| }, 10000); |
| |
| assertTrue(txFinished); |
| |
| info("Transactions finished."); |
| |
| for (Map.Entry<Integer, Collection<ClusterNode>> e : nodeMap.entrySet()) { |
| final Integer key = e.getKey(); |
| |
| final String val = map.get(key); |
| |
| assertFalse(e.getValue().isEmpty()); |
| |
| for (ClusterNode node : e.getValue()) { |
| final UUID checkNodeId = node.id(); |
| |
| compute(G.ignite(checkNodeId).cluster().forNode(node)).call(new IgniteCallable<Void>() { |
| /** */ |
| @IgniteInstanceResource |
| private Ignite ignite; |
| |
| @Override public Void call() throws Exception { |
| IgniteCache<Integer, String> cache = ignite.cache(DEFAULT_CACHE_NAME); |
| |
| assertNotNull(cache); |
| |
| if (atomicityMode() != TRANSACTIONAL_SNAPSHOT) { |
| assertEquals("Failed to check entry value on node: " + checkNodeId, |
| fullFailure ? initVal : val, cache.localPeek(key)); |
| } |
| |
| return null; |
| } |
| }); |
| } |
| } |
| |
| awaitPartitionMapExchange(); |
| |
| // Every remaining node must read the expected value and all owners must agree on the update counter. |
| for (Map.Entry<Integer, String> e : map.entrySet()) { |
| long cntr0 = -1; |
| |
| for (Ignite g : G.allGrids()) { |
| Integer key = e.getKey(); |
| |
| assertEquals(fullFailure ? initVal : e.getValue(), g.cache(DEFAULT_CACHE_NAME).get(key)); |
| |
| if (g.affinity(DEFAULT_CACHE_NAME).isPrimaryOrBackup(((IgniteEx)g).localNode(), key)) { |
| long nodeCntr = updateCoutner(g, key); |
| |
| if (cntr0 == -1) |
| cntr0 = nodeCntr; |
| |
| assertEquals(cntr0, nodeCntr); |
| } |
| } |
| } |
| } |
| |
| /** |
| * Checks transaction data consistency when a primary node crashes in the middle of a transaction. |
| * <p> |
| * A pessimistic transaction updating 20 keys is started on node 0, node 1 is stopped and the transaction |
| * is then either committed (after an explicit prepare) or rolled back. Afterwards the remaining nodes |
| * must have no pending transactions and must hold the expected values and equal update counters. |
| * |
| * @param commit Whether to commit or rollback a transaction. |
| * @throws Exception If failed. |
| */ |
| private void checkPrimaryNodeCrash(final boolean commit) throws Exception { |
| Set<Integer> keys = new HashSet<>(); |
| |
| for (int i = 0; i < 20; i++) |
| keys.add(i); |
| |
| final Collection<IgniteKernal> grids = new ArrayList<>(); |
| |
| ClusterNode primaryNode = grid(1).localNode(); |
| |
| // Collect every node except the one that is going to be stopped. |
| for (int i = 0; i < gridCount(); i++) { |
| if (i != 1) |
| grids.add((IgniteKernal)grid(i)); |
| } |
| |
| failingNodeId = primaryNode.id(); |
| |
| final Map<Integer, String> map = new HashMap<>(); |
| |
| final String initVal = "initialValue"; |
| |
| for (Integer key : keys) { |
| grid(originatingNode()).cache(DEFAULT_CACHE_NAME).put(key, initVal); |
| |
| map.put(key, String.valueOf(key)); |
| } |
| |
| // Nodes (other than the failing one) that own each key and therefore must be verified. |
| Map<Integer, Collection<ClusterNode>> nodeMap = new HashMap<>(); |
| |
| IgniteCache<Integer, String> cache = grid(0).cache(DEFAULT_CACHE_NAME); |
| |
| // Validate the cache before its first use below. |
| assertNotNull(cache); |
| |
| info("Failing node ID: " + primaryNode.id()); |
| |
| for (Integer key : keys) { |
| Collection<ClusterNode> nodes = new ArrayList<>(); |
| |
| nodes.addAll(affinity(cache).mapKeyToPrimaryAndBackups(key)); |
| |
| nodes.remove(primaryNode); |
| |
| nodeMap.put(key, nodes); |
| } |
| |
| info("Starting tx [values=" + map + ", topVer=" + grid(1).context().discovery().topologyVersion() + ']'); |
| |
| try (Transaction tx = grid(0).transactions().txStart()) { |
| cache.getAll(keys); |
| |
| // Should not send any messages. |
| cache.putAll(map); |
| |
| TransactionProxyImpl txProxy = (TransactionProxyImpl)tx; |
| |
| GridNearTxLocal txEx = txProxy.tx(); |
| |
| assertTrue(txEx.pessimistic()); |
| |
| // For the commit scenario the transaction is prepared before the node is stopped. |
| if (commit) |
| txEx.prepare(true); |
| |
| // Fail the node in the middle of transaction. |
| info(">>> Stopping primary node " + primaryNode); |
| |
| G.stop(G.ignite(primaryNode.id()).name(), true); |
| |
| info(">>> Stopped primary node, finishing transaction: " + primaryNode.id()); |
| |
| if (commit) |
| tx.commit(); |
| else |
| tx.rollback(); |
| } |
| |
| // Wait until no transactions are registered on any of the surviving nodes. |
| boolean txFinished = GridTestUtils.waitForCondition(new GridAbsPredicate() { |
| @Override public boolean apply() { |
| for (IgniteKernal g : grids) { |
| GridCacheAdapter<?, ?> cache = g.internalCache(DEFAULT_CACHE_NAME); |
| |
| IgniteTxManager txMgr = cache.isNear() ? |
| ((GridNearCacheAdapter)cache).dht().context().tm() : |
| cache.context().tm(); |
| |
| int txNum = txMgr.idMapSize(); |
| |
| if (txNum != 0) |
| return false; |
| } |
| |
| return true; |
| } |
| }, 10000); |
| |
| assertTrue(txFinished); |
| |
| info("Transactions finished."); |
| |
| for (Map.Entry<Integer, Collection<ClusterNode>> e : nodeMap.entrySet()) { |
| final Integer key = e.getKey(); |
| |
| final String val = map.get(key); |
| |
| assertFalse(e.getValue().isEmpty()); |
| |
| // Local peeks are not verified for the TRANSACTIONAL_SNAPSHOT atomicity mode. |
| if (atomicityMode() == TRANSACTIONAL_SNAPSHOT) |
| continue; |
| |
| for (ClusterNode node : e.getValue()) { |
| final UUID checkNodeId = node.id(); |
| |
| compute(G.ignite(checkNodeId).cluster().forNode(node)).call(new IgniteCallable<Void>() { |
| /** */ |
| @IgniteInstanceResource |
| private Ignite ignite; |
| |
| @Override public Void call() throws Exception { |
| IgniteCache<Integer, String> cache = ignite.cache(DEFAULT_CACHE_NAME); |
| |
| assertNotNull(cache); |
| |
| assertEquals("Failed to check entry value on node: " + checkNodeId, |
| commit ? val : initVal, cache.localPeek(key)); |
| |
| return null; |
| } |
| }); |
| } |
| } |
| |
| awaitPartitionMapExchange(); |
| |
| // Every remaining node must read the expected value and all owners must agree on the update counter. |
| for (Map.Entry<Integer, String> e : map.entrySet()) { |
| long cntr0 = -1; |
| |
| for (Ignite g : G.allGrids()) { |
| Integer key = e.getKey(); |
| |
| assertEquals(commit ? e.getValue() : initVal, g.cache(DEFAULT_CACHE_NAME).get(key)); |
| |
| if (g.affinity(DEFAULT_CACHE_NAME).isPrimaryOrBackup(((IgniteEx)g).localNode(), key)) { |
| long nodeCntr = updateCoutner(g, key); |
| |
| if (cntr0 == -1) |
| cntr0 = nodeCntr; |
| |
| assertEquals(cntr0, nodeCntr); |
| } |
| } |
| } |
| } |
| |
| /** |
| * Collects the local node ID of every started grid, in grid index order. |
| * |
| * @return All node IDs. |
| */ |
| private Collection<UUID> allNodeIds() { |
| int cnt = gridCount(); |
| |
| Collection<UUID> ids = new ArrayList<>(cnt); |
| |
| int idx = 0; |
| |
| while (idx < cnt) { |
| ids.add(grid(idx).localNode().id()); |
| |
| idx++; |
| } |
| |
| return ids; |
| } |
| |
| /** |
| * {@inheritDoc} |
| * <p> |
| * Installs a communication SPI that, on the failing node only, silently drops messages of the ignored |
| * classes addressed to the ignored destination nodes, and sets the default transaction concurrency |
| * to pessimistic. |
| */ |
| @Override protected IgniteConfiguration getConfiguration(String igniteInstanceName) throws Exception { |
| IgniteConfiguration cfg = super.getConfiguration(igniteInstanceName); |
| |
| cfg.setCommunicationSpi(new TcpCommunicationSpi() { |
| @Override public void sendMessage(ClusterNode node, Message msg, |
| IgniteInClosure<IgniteException> ackClosure) throws IgniteSpiException { |
| // Read the volatile field exactly once: afterTest() may reset it to null concurrently. |
| Collection<UUID> ignoreNodeIds = ignoreMsgNodeIds; |
| |
| if (ignoreNodeIds != null && |
| getSpiContext().localNode().id().equals(failingNodeId) && |
| msg instanceof GridIoMessage && |
| ignoredMessage((GridIoMessage)msg) && |
| ignoreNodeIds.contains(node.id())) |
| return; // Simulate message loss by not sending anything. |
| |
| super.sendMessage(node, msg, ackClosure); |
| } |
| }); |
| |
| cfg.getTransactionConfiguration().setDefaultTxConcurrency(PESSIMISTIC); |
| |
| return cfg; |
| } |
| |
| /** |
| * {@inheritDoc} |
| * <p> |
| * The cache store factory is removed and read-through and write-through are switched off. |
| */ |
| @Override protected CacheConfiguration cacheConfiguration(String igniteInstanceName) throws Exception { |
| CacheConfiguration ccfg = super.cacheConfiguration(igniteInstanceName); |
| |
| // No store factory, no read-through and no write-through for this test. |
| ccfg.setCacheStoreFactory(null); |
| ccfg.setReadThrough(false); |
| ccfg.setWriteThrough(false); |
| |
| return ccfg; |
| } |
| |
| /** |
| * {@inheritDoc} |
| * <p> |
| * Returns {@link #GRID_CNT}. |
| */ |
| @Override protected int gridCount() { |
| return GRID_CNT; |
| } |
| |
| /** |
| * {@inheritDoc} |
| * <p> |
| * Redeclared as abstract so that every concrete subclass has to choose the cache mode explicitly. |
| */ |
| @Override protected abstract CacheMode cacheMode(); |
| |
| /** |
| * {@inheritDoc} |
| * <p> |
| * Intentionally empty: grids are started for every test in {@link #beforeTest()}. |
| */ |
| @Override protected void beforeTestsStarted() throws Exception { |
| // No-op. |
| } |
| |
| /** |
| * {@inheritDoc} |
| * <p> |
| * Starts a fresh set of grids for every test. |
| */ |
| @Override protected void beforeTest() throws Exception { |
| // Start exactly as many nodes as the test bodies iterate over via gridCount(). |
| startGridsMultiThreaded(gridCount()); |
| } |
| |
| /** |
| * {@inheritDoc} |
| * <p> |
| * Intentionally empty: grids are stopped after every test in {@link #afterTest()}. |
| */ |
| @Override protected void afterTestsStopped() throws Exception { |
| // No-op |
| } |
| |
| /** |
| * {@inheritDoc} |
| * <p> |
| * Stops all grids and clears the message filtering state. |
| */ |
| @Override protected void afterTest() throws Exception { |
| stopAllGrids(); |
| |
| // Reset the complete filtering state so that nothing leaks into the next test. |
| ignoreMsgCls = null; |
| ignoreMsgNodeIds = null; |
| failingNodeId = null; |
| } |
| |
| /** |
| * Tells whether the payload of the given message is an instance of one of the ignored message classes. |
| * |
| * @param msg Message. |
| * @return {@code True} if message should be ignored. |
| */ |
| private boolean ignoredMessage(GridIoMessage msg) { |
| // Work on a snapshot, the field may be reassigned while messages are being sent. |
| Collection<Class<?>> clsSnapshot = ignoreMsgCls; |
| |
| return clsSnapshot != null && |
| clsSnapshot.stream().anyMatch(cls -> cls.isAssignableFrom(msg.message().getClass())); |
| } |
| |
| /** |
| * @param ign Node to read the counter from. |
| * @param key Key whose partition is inspected. |
| * @return Update counter of the data store for the key's partition, or {@code 0} if no such store is found. |
| */ |
| private static long updateCoutner(Ignite ign, Object key) { |
| GridCacheContext<?, ?> cctx = ((IgniteEx)ign).cachex(DEFAULT_CACHE_NAME).context(); |
| |
| Optional<IgniteCacheOffheapManager.CacheDataStore> store = dataStore(cctx, key); |
| |
| return store.isPresent() ? store.get().updateCounter() : 0L; |
| } |
| |
| /** |
| * @param cctx Cache context. |
| * @param key Key. |
| * @return First data store whose partition ID equals the partition of the key, if any. |
| */ |
| private static Optional<IgniteCacheOffheapManager.CacheDataStore> dataStore( |
| GridCacheContext<?, ?> cctx, Object key) { |
| int part = cctx.affinity().partition(key); |
| |
| for (IgniteCacheOffheapManager.CacheDataStore store : cctx.offheap().cacheDataStores()) { |
| if (store.partId() == part) |
| return Optional.of(store); |
| } |
| |
| return Optional.empty(); |
| } |
| } |