| /** |
| * Licensed to the Apache Software Foundation (ASF) under one |
| * or more contributor license agreements. See the NOTICE file |
| * distributed with this work for additional information |
| * regarding copyright ownership. The ASF licenses this file |
| * to you under the Apache License, Version 2.0 (the |
| * "License"); you may not use this file except in compliance |
| * with the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| package org.apache.hadoop.hbase.regionserver; |
| |
| import static org.junit.Assert.assertEquals; |
| import static org.junit.Assert.assertTrue; |
| |
| import java.io.IOException; |
| import java.util.ArrayList; |
| import java.util.Arrays; |
| import java.util.Collection; |
| import java.util.Collections; |
| import java.util.Comparator; |
| import java.util.List; |
| import java.util.NavigableSet; |
| import java.util.TreeSet; |
| import org.apache.hadoop.conf.Configuration; |
| import org.apache.hadoop.fs.FileSystem; |
| import org.apache.hadoop.fs.Path; |
| import org.apache.hadoop.hbase.Cell; |
| import org.apache.hadoop.hbase.CellUtil; |
| import org.apache.hadoop.hbase.HBaseClassTestRule; |
| import org.apache.hadoop.hbase.HBaseTestingUtility; |
| import org.apache.hadoop.hbase.KeyValue; |
| import org.apache.hadoop.hbase.KeyValueTestUtil; |
| import org.apache.hadoop.hbase.client.ColumnFamilyDescriptor; |
| import org.apache.hadoop.hbase.client.ColumnFamilyDescriptorBuilder; |
| import org.apache.hadoop.hbase.client.Put; |
| import org.apache.hadoop.hbase.client.Scan; |
| import org.apache.hadoop.hbase.io.compress.Compression; |
| import org.apache.hadoop.hbase.io.hfile.HFilePrettyPrinter; |
| import org.apache.hadoop.hbase.testclassification.RegionServerTests; |
| import org.apache.hadoop.hbase.testclassification.SmallTests; |
| import org.apache.hadoop.hbase.util.BloomFilterUtil; |
| import org.apache.hadoop.hbase.util.Bytes; |
| import org.junit.Before; |
| import org.junit.ClassRule; |
| import org.junit.Test; |
| import org.junit.experimental.categories.Category; |
| import org.junit.runner.RunWith; |
| import org.junit.runners.Parameterized; |
| import org.junit.runners.Parameterized.Parameters; |
| import org.slf4j.Logger; |
| import org.slf4j.LoggerFactory; |
| |
| /** |
| * Test a multi-column scanner when there is a Bloom filter false-positive. |
| * This is needed for the multi-column Bloom filter optimization. |
| */ |
| @RunWith(Parameterized.class) |
| @Category({RegionServerTests.class, SmallTests.class}) |
| public class TestScanWithBloomError { |
| |
| @ClassRule |
| public static final HBaseClassTestRule CLASS_RULE = |
| HBaseClassTestRule.forClass(TestScanWithBloomError.class); |
| |
| private static final Logger LOG = |
| LoggerFactory.getLogger(TestScanWithBloomError.class); |
| |
| private static final String TABLE_NAME = "ScanWithBloomError"; |
| private static final String FAMILY = "myCF"; |
| private static final byte[] FAMILY_BYTES = Bytes.toBytes(FAMILY); |
| private static final String ROW = "theRow"; |
| private static final String QUALIFIER_PREFIX = "qual"; |
| private static final byte[] ROW_BYTES = Bytes.toBytes(ROW); |
| private static NavigableSet<Integer> allColIds = new TreeSet<>(); |
| private HRegion region; |
| private BloomType bloomType; |
| private FileSystem fs; |
| private Configuration conf; |
| |
| private final static HBaseTestingUtility TEST_UTIL = new HBaseTestingUtility(); |
| |
| @Parameters |
| public static final Collection<Object[]> parameters() { |
| List<Object[]> configurations = new ArrayList<>(); |
| for (BloomType bloomType : BloomType.values()) { |
| configurations.add(new Object[] { bloomType }); |
| } |
| return configurations; |
| } |
| |
| public TestScanWithBloomError(BloomType bloomType) { |
| this.bloomType = bloomType; |
| } |
| |
| @Before |
| public void setUp() throws IOException{ |
| conf = TEST_UTIL.getConfiguration(); |
| fs = FileSystem.get(conf); |
| conf.setInt(BloomFilterUtil.PREFIX_LENGTH_KEY, 10); |
| } |
| |
| @Test |
| public void testThreeStoreFiles() throws IOException { |
| ColumnFamilyDescriptor columnFamilyDescriptor = |
| ColumnFamilyDescriptorBuilder |
| .newBuilder(Bytes.toBytes(FAMILY)) |
| .setCompressionType(Compression.Algorithm.GZ) |
| .setBloomFilterType(bloomType) |
| .setMaxVersions(TestMultiColumnScanner.MAX_VERSIONS).build(); |
| region = TEST_UTIL.createTestRegion(TABLE_NAME, columnFamilyDescriptor); |
| createStoreFile(new int[] {1, 2, 6}); |
| createStoreFile(new int[] {1, 2, 3, 7}); |
| createStoreFile(new int[] {1, 9}); |
| scanColSet(new int[]{1, 4, 6, 7}, new int[]{1, 6, 7}); |
| |
| HBaseTestingUtility.closeRegionAndWAL(region); |
| } |
| |
| private void scanColSet(int[] colSet, int[] expectedResultCols) |
| throws IOException { |
| LOG.info("Scanning column set: " + Arrays.toString(colSet)); |
| Scan scan = new Scan().withStartRow(ROW_BYTES).withStopRow(ROW_BYTES, true); |
| addColumnSetToScan(scan, colSet); |
| RegionScannerImpl scanner = region.getScanner(scan); |
| KeyValueHeap storeHeap = scanner.storeHeap; |
| assertEquals(0, storeHeap.getHeap().size()); |
| StoreScanner storeScanner = |
| (StoreScanner) storeHeap.getCurrentForTesting(); |
| @SuppressWarnings({ "unchecked", "rawtypes" }) |
| List<StoreFileScanner> scanners = (List<StoreFileScanner>) |
| (List) storeScanner.getAllScannersForTesting(); |
| |
| // Sort scanners by their HFile's modification time. |
| Collections.sort(scanners, new Comparator<StoreFileScanner>() { |
| @Override |
| public int compare(StoreFileScanner s1, StoreFileScanner s2) { |
| Path p1 = s1.getReader().getHFileReader().getPath(); |
| Path p2 = s2.getReader().getHFileReader().getPath(); |
| long t1, t2; |
| try { |
| t1 = fs.getFileStatus(p1).getModificationTime(); |
| t2 = fs.getFileStatus(p2).getModificationTime(); |
| } catch (IOException ex) { |
| throw new RuntimeException(ex); |
| } |
| return t1 < t2 ? -1 : t1 == t2 ? 1 : 0; |
| } |
| }); |
| |
| StoreFileReader lastStoreFileReader = null; |
| for (StoreFileScanner sfScanner : scanners) |
| lastStoreFileReader = sfScanner.getReader(); |
| |
| new HFilePrettyPrinter(conf).run(new String[]{ "-m", "-p", "-f", |
| lastStoreFileReader.getHFileReader().getPath().toString()}); |
| |
| // Disable Bloom filter for the last store file. The disabled Bloom filter |
| // will always return "true". |
| LOG.info("Disabling Bloom filter for: " |
| + lastStoreFileReader.getHFileReader().getName()); |
| lastStoreFileReader.disableBloomFilterForTesting(); |
| |
| List<Cell> allResults = new ArrayList<>(); |
| |
| { // Limit the scope of results. |
| List<Cell> results = new ArrayList<>(); |
| while (scanner.next(results) || results.size() > 0) { |
| allResults.addAll(results); |
| results.clear(); |
| } |
| } |
| |
| List<Integer> actualIds = new ArrayList<>(); |
| for (Cell kv : allResults) { |
| String qual = Bytes.toString(CellUtil.cloneQualifier(kv)); |
| assertTrue(qual.startsWith(QUALIFIER_PREFIX)); |
| actualIds.add(Integer.valueOf(qual.substring( |
| QUALIFIER_PREFIX.length()))); |
| } |
| List<Integer> expectedIds = new ArrayList<>(); |
| for (int expectedId : expectedResultCols) |
| expectedIds.add(expectedId); |
| |
| LOG.info("Column ids returned: " + actualIds + ", expected: " |
| + expectedIds); |
| assertEquals(expectedIds.toString(), actualIds.toString()); |
| } |
| |
| private void addColumnSetToScan(Scan scan, int[] colIds) { |
| for (int colId : colIds) { |
| scan.addColumn(FAMILY_BYTES, |
| Bytes.toBytes(qualFromId(colId))); |
| } |
| } |
| |
| private String qualFromId(int colId) { |
| return QUALIFIER_PREFIX + colId; |
| } |
| |
| private void createStoreFile(int[] colIds) |
| throws IOException { |
| Put p = new Put(ROW_BYTES); |
| for (int colId : colIds) { |
| long ts = Long.MAX_VALUE; |
| String qual = qualFromId(colId); |
| allColIds.add(colId); |
| KeyValue kv = KeyValueTestUtil.create(ROW, FAMILY, |
| qual, ts, TestMultiColumnScanner.createValue(ROW, qual, ts)); |
| p.add(kv); |
| } |
| region.put(p); |
| region.flush(true); |
| } |
| |
| |
| } |
| |