blob: 8a666fcf51ebcfa1ab58443c20073d846e44720f [file] [log] [blame]
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied.  See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */
package org.apache.cassandra.db;
import java.math.BigInteger;
import java.nio.ByteBuffer;
import java.nio.charset.CharacterCodingException;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.Iterator;
import java.util.List;

import com.google.common.collect.Iterators;
import org.junit.BeforeClass;
import org.junit.Test;

import static org.junit.Assert.assertEquals;
import static org.junit.Assert.assertTrue;

import org.apache.cassandra.*;
import org.apache.cassandra.config.DatabaseDescriptor;
import org.apache.cassandra.db.marshal.AsciiType;
import org.apache.cassandra.db.marshal.IntegerType;
import org.apache.cassandra.db.partitions.*;
import org.apache.cassandra.db.rows.Row;
import org.apache.cassandra.dht.IPartitioner;
import org.apache.cassandra.dht.Range;
import org.apache.cassandra.dht.Token;
import org.apache.cassandra.exceptions.ConfigurationException;
import org.apache.cassandra.locator.ReplicaPlan;
import org.apache.cassandra.locator.ReplicaPlans;
import org.apache.cassandra.locator.TokenMetadata;
import org.apache.cassandra.schema.ColumnMetadata;
import org.apache.cassandra.schema.KeyspaceParams;
import org.apache.cassandra.schema.TableMetadata;
import org.apache.cassandra.service.StorageProxy;
import org.apache.cassandra.service.StorageService;
import org.apache.cassandra.utils.ByteBufferUtil;
import org.apache.cassandra.utils.FBUtilities;
public class PartitionRangeReadTest
public static final String KEYSPACE1 = "PartitionRangeReadTest1";
public static final String KEYSPACE2 = "PartitionRangeReadTest2";
public static final String CF_STANDARD1 = "Standard1";
public static final String CF_STANDARDINT = "StandardInteger1";
public static final String CF_COMPACT1 = "Compact1";
public static void defineSchema() throws ConfigurationException
SchemaLoader.standardCFMD(KEYSPACE1, CF_STANDARD1),
SchemaLoader.denseCFMD(KEYSPACE1, CF_STANDARDINT, IntegerType.instance),
TableMetadata.builder(KEYSPACE1, CF_COMPACT1)
.addPartitionKeyColumn("key", AsciiType.instance)
.addClusteringColumn("column1", AsciiType.instance)
.addRegularColumn("value", AsciiType.instance)
.addStaticColumn("val", AsciiType.instance));
SchemaLoader.standardCFMD(KEYSPACE2, CF_STANDARD1));
public void testInclusiveBounds()
ColumnFamilyStore cfs =;
new RowUpdateBuilder(cfs.metadata(), 0, ByteBufferUtil.bytes("key1"))
.add("val", "asdf").build().applyUnsafe();
new RowUpdateBuilder(cfs.metadata(), 0, ByteBufferUtil.bytes("key2"))
.add("val", "asdf").build().applyUnsafe();
assertEquals(2, Util.getAll(Util.cmd(cfs).fromIncl("cc1").toIncl("cc2").build()).size());
public void testCassandra6778() throws CharacterCodingException
String cfname = CF_STANDARDINT;
Keyspace keyspace =;
ColumnFamilyStore cfs = keyspace.getColumnFamilyStore(cfname);
ByteBuffer col = ByteBufferUtil.bytes("val");
ColumnMetadata cDef = cfs.metadata().getColumn(col);
// insert two columns that represent the same integer but have different binary forms (the
// second one is padded with extra zeros)
new RowUpdateBuilder(cfs.metadata(), 0, "k1")
.clustering(new BigInteger(new byte[]{1}))
.add("val", "val1")
new RowUpdateBuilder(cfs.metadata(), 1, "k1")
.clustering(new BigInteger(new byte[]{0, 0, 1}))
.add("val", "val2")
// fetch by the first column name; we should get the second version of the column value
Row row = Util.getOnlyRow(Util.cmd(cfs, "k1").includeRow(new BigInteger(new byte[]{1})).build());
// fetch by the second column name; we should get the second version of the column value
row = Util.getOnlyRow(Util.cmd(cfs, "k1").includeRow(new BigInteger(new byte[]{0, 0, 1})).build());
public void testLimits()
ColumnFamilyStore cfs =;
for (int i = 0; i < 10; i++)
new RowUpdateBuilder(cfs.metadata(), 0, Integer.toString(i))
.add("val", "abcd")
new RowUpdateBuilder(cfs.metadata(), 0, Integer.toString(i))
.add("value", "")
assertEquals(10, Util.getAll(Util.cmd(cfs).build()).size());
for (int i = 0; i < 10; i++)
assertEquals(i, Util.getAll(Util.cmd(cfs).withLimit(i).build()).size());
public void testRangeSliceInclusionExclusion() throws Throwable
String keyspaceName = KEYSPACE1;
String cfName = CF_STANDARD1;
Keyspace keyspace =;
ColumnFamilyStore cfs = keyspace.getColumnFamilyStore(cfName);
for (int i = 0; i < 10; ++i)
RowUpdateBuilder builder = new RowUpdateBuilder(cfs.metadata(), 10, String.valueOf(i));
builder.add("val", String.valueOf(i));;
ColumnMetadata cDef = cfs.metadata().getColumn(ByteBufferUtil.bytes("val"));
List<FilteredPartition> partitions;
// Start and end inclusive
partitions = Util.getAll(Util.cmd(cfs).fromKeyIncl("2").toKeyIncl("7").build());
assertEquals(6, partitions.size());
assertTrue(partitions.get(partitions.size() - 1).iterator().next().getCell(cDef).value().equals(ByteBufferUtil.bytes("7")));
// Start and end excluded
partitions = Util.getAll(Util.cmd(cfs).fromKeyExcl("2").toKeyExcl("7").build());
assertEquals(4, partitions.size());
assertTrue(partitions.get(partitions.size() - 1).iterator().next().getCell(cDef).value().equals(ByteBufferUtil.bytes("6")));
// Start excluded, end included
partitions = Util.getAll(Util.cmd(cfs).fromKeyExcl("2").toKeyIncl("7").build());
assertEquals(5, partitions.size());
assertTrue(partitions.get(partitions.size() - 1).iterator().next().getCell(cDef).value().equals(ByteBufferUtil.bytes("7")));
// Start included, end excluded
partitions = Util.getAll(Util.cmd(cfs).fromKeyIncl("2").toKeyExcl("7").build());
assertEquals(5, partitions.size());
assertTrue(partitions.get(partitions.size() - 1).iterator().next().getCell(cDef).value().equals(ByteBufferUtil.bytes("6")));
public void testComputeConcurrencyFactor()
int maxConcurrentRangeRequest = 32;
// no live row returned, fetch all remaining ranges but hit the max instead
int cf = StorageProxy.RangeCommandIterator.computeConcurrencyFactor(100, 30, maxConcurrentRangeRequest, 500, 0);
assertEquals(maxConcurrentRangeRequest, cf); // because 100 - 30 = 70 > maxConccurrentRangeRequest
// no live row returned, fetch all remaining ranges
cf = StorageProxy.RangeCommandIterator.computeConcurrencyFactor(100, 80, maxConcurrentRangeRequest, 500, 0);
assertEquals(20, cf); // because 100-80 = 20 < maxConccurrentRangeRequest
// returned half rows, fetch rangesQueried again but hit the max instead
cf = StorageProxy.RangeCommandIterator.computeConcurrencyFactor(100, 60, maxConcurrentRangeRequest, 480, 240);
assertEquals(maxConcurrentRangeRequest, cf); // because 60 > maxConccurrentRangeRequest
// returned half rows, fetch rangesQueried again
cf = StorageProxy.RangeCommandIterator.computeConcurrencyFactor(100, 30, maxConcurrentRangeRequest, 480, 240);
assertEquals(30, cf); // because 30 < maxConccurrentRangeRequest
// returned most of rows, 1 more range to fetch
cf = StorageProxy.RangeCommandIterator.computeConcurrencyFactor(100, 1, maxConcurrentRangeRequest, 480, 479);
assertEquals(1, cf); // because 1 < maxConccurrentRangeRequest
public void testRangeCountWithRangeMerge()
List<Token> tokens = setTokens(Arrays.asList(100, 200, 300, 400));
int vnodeCount = 0;
Keyspace keyspace =;
List<ReplicaPlan.ForRangeRead> ranges = new ArrayList<>();
for (int i = 0; i + 1 < tokens.size(); i++)
Range<PartitionPosition> range = Range.makeRowRange(tokens.get(i), tokens.get(i + 1));
ranges.add(ReplicaPlans.forRangeRead(keyspace, ConsistencyLevel.ONE, range, 1));
StorageProxy.RangeMerger merge = new StorageProxy.RangeMerger(ranges.iterator(), keyspace, ConsistencyLevel.ONE);
ReplicaPlan.ForRangeRead mergedRange = Iterators.getOnlyElement(merge);
// all ranges are merged as test has only one node.
assertEquals(vnodeCount, mergedRange.vnodeCount());
public void testRangeQueried()
List<Token> tokens = setTokens(Arrays.asList(100, 200, 300, 400));
int vnodeCount = tokens.size() + 1; // n tokens divide token ring into n+1 ranges
Keyspace keyspace =;
ColumnFamilyStore cfs = keyspace.getColumnFamilyStore(CF_STANDARD1);
int rows = 100;
for (int i = 0; i < rows; ++i)
RowUpdateBuilder builder = new RowUpdateBuilder(cfs.metadata(), 10, String.valueOf(i));
builder.add("val", String.valueOf(i));;
PartitionRangeReadCommand command = (PartitionRangeReadCommand) Util.cmd(cfs).build();
// without range merger, there will be 2 batches requested: 1st batch with 1 range and 2nd batch with remaining ranges
Iterator<ReplicaPlan.ForRangeRead> ranges = rangeIterator(command, keyspace, false);
StorageProxy.RangeCommandIterator data = new StorageProxy.RangeCommandIterator(ranges, command, 1, 1000, vnodeCount, System.nanoTime());
verifyRangeCommandIterator(data, rows, 2, vnodeCount);
// without range merger and initial cf=5, there will be 1 batches requested: 5 vnode ranges for 1st batch
ranges = rangeIterator(command, keyspace, false);
data = new StorageProxy.RangeCommandIterator(ranges, command, vnodeCount, 1000, vnodeCount, System.nanoTime());
verifyRangeCommandIterator(data, rows, 1, vnodeCount);
// without range merger and max cf=1, there will be 5 batches requested: 1 vnode range per batch
ranges = rangeIterator(command, keyspace, false);
data = new StorageProxy.RangeCommandIterator(ranges, command, 1, 1, vnodeCount, System.nanoTime());
verifyRangeCommandIterator(data, rows, vnodeCount, vnodeCount);
// with range merger, there will be only 1 batch requested, as all ranges share the same replica - localhost
ranges = rangeIterator(command, keyspace, true);
data = new StorageProxy.RangeCommandIterator(ranges, command, 1, 1000, vnodeCount, System.nanoTime());
verifyRangeCommandIterator(data, rows, 1, vnodeCount);
// with range merger and max cf=1, there will be only 1 batch requested, as all ranges share the same replica - localhost
ranges = rangeIterator(command, keyspace, true);
data = new StorageProxy.RangeCommandIterator(ranges, command, 1, 1, vnodeCount, System.nanoTime());
verifyRangeCommandIterator(data, rows, 1, vnodeCount);
private Iterator<ReplicaPlan.ForRangeRead> rangeIterator(PartitionRangeReadCommand command, Keyspace keyspace, boolean withRangeMerger)
Iterator<ReplicaPlan.ForRangeRead> ranges = new StorageProxy.RangeIterator(command, keyspace, ConsistencyLevel.ONE);
if (withRangeMerger)
ranges = new StorageProxy.RangeMerger(ranges, keyspace, ConsistencyLevel.ONE);
return ranges;
private void verifyRangeCommandIterator(StorageProxy.RangeCommandIterator data, int rows, int batches, int vnodeCount)
int num = Util.size(data);
assertEquals(rows, num);
assertEquals(batches, data.batchesRequested());
assertEquals(vnodeCount, data.rangesQueried());
private List<Token> setTokens(List<Integer> values)
IPartitioner partitioner = DatabaseDescriptor.getPartitioner();
List<Token> tokens = new ArrayList<>(values.size());
for (Integer val : values)
TokenMetadata tmd = StorageService.instance.getTokenMetadata();
tmd.updateNormalTokens(tokens, FBUtilities.getBroadcastAddressAndPort());
return tokens;