blob: 8186385efb82d4f6bf7733076ef9b1e8296aa44b [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.ignite.internal.processors.cache.distributed;
import java.util.ArrayList;
import java.util.Collection;
import java.util.Collections;
import java.util.HashMap;
import java.util.HashSet;
import java.util.Map;
import java.util.Optional;
import java.util.Set;
import java.util.UUID;
import java.util.concurrent.Callable;
import java.util.concurrent.TimeUnit;
import java.util.stream.StreamSupport;
import org.apache.ignite.Ignite;
import org.apache.ignite.IgniteCache;
import org.apache.ignite.IgniteException;
import org.apache.ignite.Ignition;
import org.apache.ignite.cache.CacheMode;
import org.apache.ignite.cluster.ClusterNode;
import org.apache.ignite.configuration.CacheConfiguration;
import org.apache.ignite.configuration.IgniteConfiguration;
import org.apache.ignite.internal.IgniteEx;
import org.apache.ignite.internal.IgniteKernal;
import org.apache.ignite.internal.managers.communication.GridIoMessage;
import org.apache.ignite.internal.processors.cache.GridCacheAbstractSelfTest;
import org.apache.ignite.internal.processors.cache.GridCacheAdapter;
import org.apache.ignite.internal.processors.cache.GridCacheContext;
import org.apache.ignite.internal.processors.cache.IgniteCacheOffheapManager;
import org.apache.ignite.internal.processors.cache.distributed.near.GridNearCacheAdapter;
import org.apache.ignite.internal.processors.cache.distributed.near.GridNearTxLocal;
import org.apache.ignite.internal.processors.cache.transactions.IgniteTxManager;
import org.apache.ignite.internal.processors.cache.transactions.TransactionProxyImpl;
import org.apache.ignite.internal.util.lang.GridAbsPredicate;
import org.apache.ignite.internal.util.typedef.F;
import org.apache.ignite.internal.util.typedef.G;
import org.apache.ignite.lang.IgniteCallable;
import org.apache.ignite.lang.IgniteFuture;
import org.apache.ignite.lang.IgniteFutureTimeoutException;
import org.apache.ignite.lang.IgniteInClosure;
import org.apache.ignite.plugin.extensions.communication.Message;
import org.apache.ignite.resources.IgniteInstanceResource;
import org.apache.ignite.spi.IgniteSpiException;
import org.apache.ignite.spi.communication.tcp.TcpCommunicationSpi;
import org.apache.ignite.testframework.GridTestUtils;
import org.apache.ignite.transactions.Transaction;
import org.junit.Test;
import static org.apache.ignite.cache.CacheAtomicityMode.TRANSACTIONAL_SNAPSHOT;
import static org.apache.ignite.transactions.TransactionConcurrency.PESSIMISTIC;
/**
* Abstract test for originating node failure.
*/
public abstract class IgniteTxPessimisticOriginatingNodeFailureAbstractSelfTest extends GridCacheAbstractSelfTest {
/** */
protected static final int GRID_CNT = 5;
/** Ignore node ID. */
private volatile Collection<UUID> ignoreMsgNodeIds;
/** Ignore message class. */
private Collection<Class<?>> ignoreMsgCls;
/** Failing node ID. */
private UUID failingNodeId;
/**
* @throws Exception If failed.
*/
@Test
public void testManyKeysCommit() throws Exception {
Collection<Integer> keys = new ArrayList<>(200);
for (int i = 0; i < 200; i++)
keys.add(i);
testTxOriginatingNodeFails(keys, false);
}
/**
* @throws Exception If failed.
*/
@Test
public void testManyKeysRollback() throws Exception {
Collection<Integer> keys = new ArrayList<>(200);
for (int i = 0; i < 200; i++)
keys.add(i);
testTxOriginatingNodeFails(keys, true);
}
/**
* @throws Exception If failed.
*/
@Test
public void testPrimaryNodeFailureCommit() throws Exception {
checkPrimaryNodeCrash(true);
}
/**
* @throws Exception If failed.
*/
@Test
public void testPrimaryNodeFailureRollback() throws Exception {
checkPrimaryNodeCrash(false);
}
/**
* @return Index of node starting transaction.
*/
protected int originatingNode() {
return 0;
}
/**
* Ignores messages to given node of given type.
*
* @param dstNodeIds Destination node IDs.
* @param msgCls Message type.
*/
protected void ignoreMessages(Collection<Class<?>> msgCls, Collection<UUID> dstNodeIds) {
ignoreMsgNodeIds = dstNodeIds;
ignoreMsgCls = msgCls;
}
/**
* Gets ignore message class to simulate partial prepare message.
*
* @return Ignore message class.
*/
protected abstract Collection<Class<?>> ignoreMessageClasses();
/**
* @param keys Keys to update.
* @param fullFailure Flag indicating whether to simulate rollback state.
* @throws Exception If failed.
*/
protected void testTxOriginatingNodeFails(Collection<Integer> keys, final boolean fullFailure) throws Exception {
assertFalse(keys.isEmpty());
final Collection<IgniteKernal> grids = new ArrayList<>();
ClusterNode txNode = grid(originatingNode()).localNode();
for (int i = 1; i < gridCount(); i++)
grids.add((IgniteKernal)grid(i));
failingNodeId = grid(0).localNode().id();
final Map<Integer, String> map = new HashMap<>();
final String initVal = "initialValue";
for (Integer key : keys) {
grid(originatingNode()).cache(DEFAULT_CACHE_NAME).put(key, initVal);
map.put(key, String.valueOf(key));
}
Map<Integer, Collection<ClusterNode>> nodeMap = new HashMap<>();
info("Node being checked: " + grid(1).localNode().id());
for (Integer key : keys) {
Collection<ClusterNode> nodes = new ArrayList<>();
nodes.addAll(grid(1).affinity(DEFAULT_CACHE_NAME).mapKeyToPrimaryAndBackups(key));
nodes.remove(txNode);
nodeMap.put(key, nodes);
}
info("Starting tx [values=" + map + ", topVer=" +
((IgniteKernal)grid(1)).context().discovery().topologyVersion() + ']');
if (fullFailure)
ignoreMessages(ignoreMessageClasses(), F.asList(grid(1).localNode().id()));
final IgniteEx originatingNodeGrid = grid(originatingNode());
GridTestUtils.runAsync(new Callable<Void>() {
@Override public Void call() throws Exception {
IgniteCache<Integer, String> cache = originatingNodeGrid.cache(DEFAULT_CACHE_NAME);
assertNotNull(cache);
Transaction tx = originatingNodeGrid.transactions().txStart();
assertEquals(PESSIMISTIC, tx.concurrency());
try {
cache.putAll(map);
info("Before commitAsync");
IgniteFuture<?> fut = tx.commitAsync();
info("Got future for commitAsync().");
fut.get(3, TimeUnit.SECONDS);
}
catch (IgniteFutureTimeoutException ignored) {
info("Failed to wait for commit future completion [fullFailure=" + fullFailure + ']');
}
return null;
}
}).get();
info(">>> Stopping originating node " + txNode);
G.stop(grid(originatingNode()).name(), true);
ignoreMessages(Collections.<Class<?>>emptyList(), Collections.<UUID>emptyList());
info(">>> Stopped originating node: " + txNode.id());
boolean txFinished = GridTestUtils.waitForCondition(new GridAbsPredicate() {
@Override public boolean apply() {
for (IgniteKernal g : grids) {
GridCacheAdapter<?, ?> cache = g.internalCache(DEFAULT_CACHE_NAME);
IgniteTxManager txMgr = cache.isNear() ?
((GridNearCacheAdapter)cache).dht().context().tm() :
cache.context().tm();
int txNum = txMgr.idMapSize();
if (txNum != 0)
return false;
}
return true;
}
}, 10000);
assertTrue(txFinished);
info("Transactions finished.");
for (Map.Entry<Integer, Collection<ClusterNode>> e : nodeMap.entrySet()) {
final Integer key = e.getKey();
final String val = map.get(key);
assertFalse(e.getValue().isEmpty());
for (ClusterNode node : e.getValue()) {
final UUID checkNodeId = node.id();
compute(G.ignite(checkNodeId).cluster().forNode(node)).call(new IgniteCallable<Void>() {
/** */
@IgniteInstanceResource
private Ignite ignite;
@Override public Void call() throws Exception {
IgniteCache<Integer, String> cache = ignite.cache(DEFAULT_CACHE_NAME);
assertNotNull(cache);
if (atomicityMode() != TRANSACTIONAL_SNAPSHOT) {
assertEquals("Failed to check entry value on node: " + checkNodeId,
fullFailure ? initVal : val, cache.localPeek(key));
}
return null;
}
});
}
}
awaitPartitionMapExchange();
for (Map.Entry<Integer, String> e : map.entrySet()) {
long cntr0 = -1;
for (Ignite g : G.allGrids()) {
Integer key = e.getKey();
assertEquals(fullFailure ? initVal : e.getValue(), g.cache(DEFAULT_CACHE_NAME).get(key));
if (g.affinity(DEFAULT_CACHE_NAME).isPrimaryOrBackup(((IgniteEx)g).localNode(), key)) {
long nodeCntr = updateCoutner(g, key);
if (cntr0 == -1)
cntr0 = nodeCntr;
assertEquals(cntr0, nodeCntr);
}
}
}
}
/**
* Checks tx data consistency in case when primary node crashes.
*
* @param commmit Whether to commit or rollback a transaction.
* @throws Exception If failed.
*/
private void checkPrimaryNodeCrash(final boolean commmit) throws Exception {
Set<Integer> keys = new HashSet<>();
for (int i = 0; i < 20; i++)
keys.add(i);
final Collection<IgniteKernal> grids = new ArrayList<>();
ClusterNode primaryNode = grid(1).localNode();
for (int i = 0; i < gridCount(); i++) {
if (i != 1)
grids.add((IgniteKernal)grid(i));
}
failingNodeId = primaryNode.id();
final Map<Integer, String> map = new HashMap<>();
final String initVal = "initialValue";
for (Integer key : keys) {
grid(originatingNode()).cache(DEFAULT_CACHE_NAME).put(key, initVal);
map.put(key, String.valueOf(key));
}
Map<Integer, Collection<ClusterNode>> nodeMap = new HashMap<>();
IgniteCache<Integer, String> cache = grid(0).cache(DEFAULT_CACHE_NAME);
info("Failing node ID: " + grid(1).localNode().id());
for (Integer key : keys) {
Collection<ClusterNode> nodes = new ArrayList<>();
nodes.addAll(affinity(cache).mapKeyToPrimaryAndBackups(key));
nodes.remove(primaryNode);
nodeMap.put(key, nodes);
}
info("Starting tx [values=" + map + ", topVer=" + grid(1).context().discovery().topologyVersion() + ']');
assertNotNull(cache);
try (Transaction tx = grid(0).transactions().txStart()) {
cache.getAll(keys);
// Should not send any messages.
cache.putAll(map);
TransactionProxyImpl txProxy = (TransactionProxyImpl)tx;
GridNearTxLocal txEx = txProxy.tx();
assertTrue(txEx.pessimistic());
if (commmit) {
txEx.prepare(true);
// Fail the node in the middle of transaction.
info(">>> Stopping primary node " + primaryNode);
G.stop(Ignition.ignite(primaryNode.id()).name(), true);
info(">>> Stopped originating node, finishing transaction: " + primaryNode.id());
tx.commit();
}
else {
// Fail the node in the middle of transaction.
info(">>> Stopping primary node " + primaryNode);
G.stop(G.ignite(primaryNode.id()).name(), true);
info(">>> Stopped originating node, finishing transaction: " + primaryNode.id());
tx.rollback();
}
}
boolean txFinished = GridTestUtils.waitForCondition(new GridAbsPredicate() {
@Override public boolean apply() {
for (IgniteKernal g : grids) {
GridCacheAdapter<?, ?> cache = g.internalCache(DEFAULT_CACHE_NAME);
IgniteTxManager txMgr = cache.isNear() ?
((GridNearCacheAdapter)cache).dht().context().tm() :
cache.context().tm();
int txNum = txMgr.idMapSize();
if (txNum != 0)
return false;
}
return true;
}
}, 10000);
assertTrue(txFinished);
info("Transactions finished.");
for (Map.Entry<Integer, Collection<ClusterNode>> e : nodeMap.entrySet()) {
final Integer key = e.getKey();
final String val = map.get(key);
assertFalse(e.getValue().isEmpty());
if (atomicityMode() == TRANSACTIONAL_SNAPSHOT)
continue;
for (ClusterNode node : e.getValue()) {
final UUID checkNodeId = node.id();
compute(G.ignite(checkNodeId).cluster().forNode(node)).call(new IgniteCallable<Void>() {
/** */
@IgniteInstanceResource
private Ignite ignite;
@Override public Void call() throws Exception {
IgniteCache<Integer, String> cache = ignite.cache(DEFAULT_CACHE_NAME);
assertNotNull(cache);
assertEquals("Failed to check entry value on node: " + checkNodeId,
!commmit ? initVal : val, cache.localPeek(key));
return null;
}
});
}
}
awaitPartitionMapExchange();
for (Map.Entry<Integer, String> e : map.entrySet()) {
long cntr0 = -1;
for (Ignite g : G.allGrids()) {
Integer key = e.getKey();
assertEquals(!commmit ? initVal : e.getValue(), g.cache(DEFAULT_CACHE_NAME).get(key));
if (g.affinity(DEFAULT_CACHE_NAME).isPrimaryOrBackup(((IgniteEx)g).localNode(), key)) {
long nodeCntr = updateCoutner(g, key);
if (cntr0 == -1)
cntr0 = nodeCntr;
assertEquals(cntr0, nodeCntr);
}
}
}
}
/**
* @return All node IDs.
*/
private Collection<UUID> allNodeIds() {
Collection<UUID> nodeIds = new ArrayList<>(gridCount());
for (int i = 0; i < gridCount(); i++)
nodeIds.add(grid(i).localNode().id());
return nodeIds;
}
/** {@inheritDoc} */
@Override protected IgniteConfiguration getConfiguration(String igniteInstanceName) throws Exception {
IgniteConfiguration cfg = super.getConfiguration(igniteInstanceName);
cfg.setCommunicationSpi(new TcpCommunicationSpi() {
@Override public void sendMessage(ClusterNode node, Message msg,
IgniteInClosure<IgniteException> ackClosure) throws IgniteSpiException {
if (getSpiContext().localNode().id().equals(failingNodeId)) {
if (ignoredMessage((GridIoMessage)msg) && ignoreMsgNodeIds != null) {
for (UUID ignored : ignoreMsgNodeIds) {
if (node.id().equals(ignored))
return;
}
}
}
super.sendMessage(node, msg, ackClosure);
}
});
cfg.getTransactionConfiguration().setDefaultTxConcurrency(PESSIMISTIC);
return cfg;
}
/** {@inheritDoc} */
@Override protected CacheConfiguration cacheConfiguration(String igniteInstanceName) throws Exception {
CacheConfiguration cfg = super.cacheConfiguration(igniteInstanceName);
cfg.setCacheStoreFactory(null);
cfg.setReadThrough(false);
cfg.setWriteThrough(false);
return cfg;
}
/** {@inheritDoc} */
@Override protected int gridCount() {
return GRID_CNT;
}
/** {@inheritDoc} */
@Override protected abstract CacheMode cacheMode();
/** {@inheritDoc} */
@Override protected void beforeTestsStarted() throws Exception {
// No-op.
}
/** {@inheritDoc} */
@Override protected void beforeTest() throws Exception {
startGridsMultiThreaded(GRID_CNT);
}
/** {@inheritDoc} */
@Override protected void afterTestsStopped() throws Exception {
// No-op
}
/** {@inheritDoc} */
@Override protected void afterTest() throws Exception {
stopAllGrids();
ignoreMsgCls = null;
ignoreMsgNodeIds = null;
}
/**
* Checks if message should be ignored.
*
* @param msg Message.
* @return {@code True} if message should be ignored.
*/
private boolean ignoredMessage(GridIoMessage msg) {
Collection<Class<?>> ignoreClss = ignoreMsgCls;
if (ignoreClss != null) {
for (Class<?> ignoreCls : ignoreClss) {
if (ignoreCls.isAssignableFrom(msg.message().getClass()))
return true;
}
return false;
}
else
return false;
}
/** */
private static long updateCoutner(Ignite ign, Object key) {
return dataStore(((IgniteEx)ign).cachex(DEFAULT_CACHE_NAME).context(), key)
.map(IgniteCacheOffheapManager.CacheDataStore::updateCounter)
.orElse(0L);
}
/** */
private static Optional<IgniteCacheOffheapManager.CacheDataStore> dataStore(
GridCacheContext<?, ?> cctx, Object key) {
int p = cctx.affinity().partition(key);
return StreamSupport.stream(cctx.offheap().cacheDataStores().spliterator(), false)
.filter(ds -> ds.partId() == p)
.findFirst();
}
}