blob: adcfd1ff96c66806281a9a8d9826c478bd05376d [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.cassandra.distributed.upgrade;
import java.util.UUID;
import java.util.concurrent.CompletableFuture;
import java.util.concurrent.RejectedExecutionException;
import java.util.concurrent.TimeUnit;
import java.util.concurrent.TimeoutException;
import org.junit.Assert;
import org.junit.Test;
import org.apache.cassandra.distributed.UpgradeableCluster;
import org.apache.cassandra.distributed.api.IUpgradeableInstance;
import static org.apache.cassandra.distributed.api.Feature.GOSSIP;
import static org.apache.cassandra.distributed.api.Feature.NETWORK;
import static org.apache.cassandra.distributed.shared.AssertUtils.assertRows;
import static org.apache.cassandra.distributed.shared.AssertUtils.fail;
import static org.apache.cassandra.distributed.shared.AssertUtils.row;
public class MixedModeRepairTest extends UpgradeTestBase
{
public static final int UPGRADED_NODE = 1;
public static final String CREATE_TABLE = withKeyspace("CREATE TABLE %s.t (k uuid, c int, v int, PRIMARY KEY (k, c))");
public static final String INSERT = withKeyspace("INSERT INTO %s.t (k, c, v) VALUES (?, ?, ?)");
public static final String SELECT = withKeyspace("SELECT * FROM %s.t WHERE k=?");
/**
* Test that repairs fail during a major upgrade. If the repaired node is >= 4.0 thanks to CASSANDRA-13944 there
* will be an informative message. Otherwise, if the repaired node is below 4.0, there won't be such an informative
* message and the repair will take very long to timeout.
*/
@Test
public void testRepairDuringMajorUpgrade() throws Throwable
{
new UpgradeTestBase.TestCase()
.nodes(2)
.nodesToUpgrade(UPGRADED_NODE)
.upgradesFrom(v3X)
.withConfig(config -> config.with(NETWORK, GOSSIP))
.setup(cluster -> {
cluster.schemaChange(CREATE_TABLE);
cluster.setUncaughtExceptionsFilter(throwable -> throwable instanceof RejectedExecutionException);
})
.runAfterNodeUpgrade((cluster, node) -> {
// run the repair scenario in both the upgraded and the not upgraded node
for (int repairedNode = 1; repairedNode <= cluster.size(); repairedNode++)
{
UUID key = UUID.randomUUID();
// only in node 1, create a sstable with a version of a partition
Object[] row1 = row(key, 10, 100);
cluster.get(1).executeInternal(INSERT, row1);
cluster.get(1).flush(KEYSPACE);
// only in node 2, create a sstable with another version of the partition
Object[] row2 = row(key, 20, 200);
cluster.get(2).executeInternal(INSERT, row2);
cluster.get(2).flush(KEYSPACE);
// in case of repairing the upgraded node the repair should be rejected with a decriptive error in both
// nodetool output and logs (see CASSANDRA-13944)
if (repairedNode == UPGRADED_NODE)
{
String errorMessage = "Repair is not supported in mixed major version clusters";
cluster.get(repairedNode)
.nodetoolResult("repair", "--full", KEYSPACE)
.asserts()
.errorContains(errorMessage);
assertLogHas(cluster, repairedNode, errorMessage);
}
// if the node issuing the repair is the not updated node we don't have specific error management,
// so the repair will produce a failure in the upgraded node, and it will take one hour to time out in
// the not upgraded node. Since we don't want to wait that long, we only wait a few seconds for the
// repair before verifying the "unknown verb id" error in the upgraded node.
else
{
try
{
IUpgradeableInstance instance = cluster.get(repairedNode);
CompletableFuture.supplyAsync(() -> instance.nodetoolResult("repair", "--full", KEYSPACE))
.get(10, TimeUnit.SECONDS);
fail("Repair in the not upgraded node should have timed out");
}
catch (TimeoutException e)
{
assertLogHas(cluster, UPGRADED_NODE, "unexpected exception caught while processing inbound messages");
assertLogHas(cluster, UPGRADED_NODE, "java.lang.IllegalArgumentException: Unknown verb id");
}
}
// verify that the previous failed repair hasn't repaired the data
assertRows(cluster.get(1).executeInternal(SELECT, key), row1);
assertRows(cluster.get(2).executeInternal(SELECT, key), row2);
}
})
.run();
}
private static void assertLogHas(UpgradeableCluster cluster, int node, String msg)
{
Assert.assertFalse("Unable to find '" + msg + "' in the logs of node " + node,
cluster.get(node).logs().grep(msg).getResult().isEmpty());
}
}