blob: 59fb21f5220dcf95d8624888e2c80e509ca922c7 [file] [log] [blame]
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* See the License for the specific language governing permissions and
* limitations under the License.
package org.apache.phoenix.iterate;
import static org.apache.phoenix.coprocessor.ScanRegionObserver.WILDCARD_SCAN_INCLUDES_DYNAMIC_COLUMNS;
import static org.apache.phoenix.schema.types.PDataType.TRUE_BYTES;
import org.apache.hadoop.hbase.CellUtil;
import org.apache.phoenix.coprocessor.UncoveredGlobalIndexRegionScanner;
import org.apache.phoenix.coprocessor.UncoveredLocalIndexRegionScanner;
import org.apache.phoenix.schema.KeyValueSchema;
import org.apache.phoenix.schema.PColumn;
import org.apache.phoenix.schema.PColumnImpl;
import org.apache.phoenix.schema.PTable;
import org.apache.phoenix.schema.ValueBitSet;
import org.apache.hadoop.hbase.Cell;
import org.apache.hadoop.hbase.HConstants;
import org.apache.hadoop.hbase.KeyValue;
import org.apache.hadoop.hbase.client.RegionInfo;
import org.apache.hadoop.hbase.client.Result;
import org.apache.hadoop.hbase.client.Scan;
import org.apache.hadoop.hbase.coprocessor.RegionCoprocessorEnvironment;
import org.apache.hadoop.hbase.regionserver.Region;
import org.apache.hadoop.hbase.regionserver.RegionScanner;
import org.apache.hadoop.hbase.regionserver.ScannerContext;
import org.apache.hadoop.hbase.regionserver.ScannerContextUtil;
import org.apache.hadoop.hbase.util.Bytes;
import org.apache.hadoop.hbase.util.Pair;
import org.apache.phoenix.coprocessor.BaseScannerRegionObserver;
import org.apache.phoenix.coprocessor.generated.DynamicColumnMetaDataProtos;
import org.apache.phoenix.execute.TupleProjector;
import org.apache.phoenix.expression.Expression;
import org.apache.phoenix.expression.ExpressionType;
import org.apache.phoenix.expression.KeyValueColumnExpression;
import org.apache.phoenix.hbase.index.covered.update.ColumnReference;
import org.apache.phoenix.index.IndexMaintainer;
import org.apache.phoenix.query.QueryConstants;
import org.apache.phoenix.schema.tuple.MultiKeyValueTuple;
import org.apache.phoenix.schema.tuple.PositionBasedResultTuple;
import org.apache.phoenix.schema.tuple.ResultTuple;
import org.apache.phoenix.schema.tuple.Tuple;
import org.apache.phoenix.transaction.PhoenixTransactionContext;
import org.apache.phoenix.util.EncodedColumnsUtil;
import org.apache.phoenix.util.EnvironmentEdgeManager;
import org.apache.phoenix.util.IndexUtil;
import org.apache.phoenix.util.ScanUtil;
import org.apache.phoenix.util.ServerUtil;
import java.util.ArrayList;
import java.util.List;
import java.util.ListIterator;
import java.util.Set;
// Abstract base for factories that produce the RegionScanner used to serve a scan.
// Subclasses implement getRegionScanner(); getWrappedScanner() builds the wrapping scanner.
public abstract class RegionScannerFactory {
// Coprocessor environment of this factory; getRegion() reads the region from it.
protected RegionCoprocessorEnvironment env;
* Returns the region of the coprocessor environment
* held by this factory.
* @return the region obtained from the environment
public Region getRegion() {
// Reads the region from the env field of this factory.
return env.getRegion();
* Returns a processed region scanner based on the query
* conditions. This functionality is abstracted out of
* the non-aggregate region observer class for better
* usage.
* @param scan input scan
* @param s input region scanner
* @return the region scanner to use for the given scan
* @throws Throwable if an implementation fails to build the scanner
// Abstract: every concrete factory supplies its own implementation.
public abstract RegionScanner getRegionScanner(final Scan scan, final RegionScanner s) throws Throwable;
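* Return wrapped scanner that catches unexpected exceptions (i.e. Phoenix bugs) and
* re-throws as DoNotRetryIOException to prevent needless retrying hanging the query
* for 30 seconds. Unfortunately, until HBASE-7481 gets fixed, there's no way to do
* the same from a custom filter.
* @param arrayKVRefs column expressions identifying the cells that hold full array values
* @param arrayFuncRefs array element expressions serialized into the array element cell
* @param offset starting position in the rowkey.
* @param scan the scan being served; its attributes drive the index and projection handling
* @param tupleProjector projector passed to the uncovered index region scanners
* @param dataRegion region passed to the uncovered index region scanners
* @param indexMaintainer index maintainer passed to the uncovered index region scanners
* @param tx current transaction
* @param viewConstants view constants passed to the uncovered index region scanners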
// Returns an anonymous RegionScanner that delegates to regionScanner, or to an uncovered
// index scanner wrapping it, and post-processes the rows it returns in nextRaw().
// Note: the env parameter shadows the env field of this class inside this method.
// Note: tupleProjector is passed to the uncovered index scanners below, while projector
// is the one applied to each row in nextRaw().
public RegionScanner getWrappedScanner(final RegionCoprocessorEnvironment env,
final RegionScanner regionScanner, final Set<KeyValueColumnExpression> arrayKVRefs,
final Expression[] arrayFuncRefs, final int offset, final Scan scan,
final ColumnReference[] dataColumns, final TupleProjector tupleProjector,
final Region dataRegion, final IndexMaintainer indexMaintainer,
PhoenixTransactionContext tx,
final byte[][] viewConstants, final KeyValueSchema kvSchema,
final ValueBitSet kvSchemaBitSet, final TupleProjector projector,
final ImmutableBytesWritable ptr, final boolean useQualifierAsListIndex) throws IOException {
return new RegionScanner() {
// Delegate scanner; reassigned below to an uncovered index scanner when one is needed.
private RegionScanner s = regionScanner;
// Must be initialized before actualStartKey, whose initializer reads it.
private RegionInfo regionInfo = env.getRegionInfo();
// Non-null only for local index scans (see getActualStartKey()).
private byte[] actualStartKey = getActualStartKey();
private boolean useNewValueColumnQualifier = EncodedColumnsUtil.useNewValueColumnQualifier(scan);
// Time budget in milliseconds that scanTillScanStartRow() checks before handing back a dummy result.
final long pageSizeMs = ScanUtil.getPageSizeMsForRegionScanner(scan);
// Extra filter read from the scan attributes; stays null when no filter attribute is set.
Expression extraWhere = null;
// Row limit read from the scan attributes; stays -1 when no limit attribute is set.
long extraLimit = -1;
// for indexes construct the row filter for uncovered columns if it exists
if (ScanUtil.isLocalOrUncoveredGlobalIndex(scan)) {
// Prefer the INDEX_FILTER attribute and fall back to LOCAL_INDEX_FILTER.
byte[] expBytes = scan.getAttribute(BaseScannerRegionObserver.INDEX_FILTER);
if (expBytes == null) {
// For older clients
expBytes = scan.getAttribute(BaseScannerRegionObserver.LOCAL_INDEX_FILTER);
if (expBytes != null) {
try {
ByteArrayInputStream stream = new ByteArrayInputStream(expBytes);
DataInputStream input = new DataInputStream(stream);
// The leading vint selects the ExpressionType whose instance becomes the filter.
extraWhere = ExpressionType.values()[WritableUtils.readVInt(input)].newInstance();
} catch (IOException io) {
// should not happen since we're reading from a byte[]
throw new RuntimeException(io);
// Same lookup order for the limit: INDEX_LIMIT first, then LOCAL_INDEX_LIMIT.
byte[] limitBytes = scan.getAttribute(BaseScannerRegionObserver.INDEX_LIMIT);
if (limitBytes == null) {
// For older clients
limitBytes = scan.getAttribute(BaseScannerRegionObserver.LOCAL_INDEX_LIMIT);
if (limitBytes != null) {
extraLimit = Bytes.toLong(limitBytes);
// For index scans with a tuple projector or an uncovered index: collect the data table
// columns into dataTableScan and replace the delegate s with an uncovered index scanner.
if (ScanUtil.isLocalOrUncoveredGlobalIndex(scan)
&& (tupleProjector != null
|| (indexMaintainer != null && indexMaintainer.isUncovered()))) {
PTable.ImmutableStorageScheme storageScheme =
Scan dataTableScan = new Scan();
if (dataColumns != null) {
for (int i = 0; i < dataColumns.length; i++) {
if (storageScheme ==
PTable.ImmutableStorageScheme.SINGLE_CELL_ARRAY_WITH_OFFSETS) {
} else {
} else if (indexMaintainer.isUncovered()) {
// Indexed columns should also be added to the data columns to join for uncovered global indexes.
// This is required to verify the index row against the data table row.
for (ColumnReference cr: indexMaintainer.getIndexedColumns()) {
if (storageScheme == PTable.ImmutableStorageScheme.SINGLE_CELL_ARRAY_WITH_OFFSETS) {
} else {
dataTableScan.addColumn(cr.getFamily(), cr.getQualifier());
// The local index scanner additionally receives offset and actualStartKey.
if (ScanUtil.isLocalIndex(scan)) {
s = new UncoveredLocalIndexRegionScanner(regionScanner, dataRegion, scan, env,
dataTableScan, tupleProjector, indexMaintainer, viewConstants, ptr,
pageSizeMs, offset, actualStartKey, extraLimit);
} else {
s = new UncoveredGlobalIndexRegionScanner(regionScanner, dataRegion, scan, env,
dataTableScan, tupleProjector, indexMaintainer, viewConstants, ptr,
pageSizeMs, extraLimit);
// Returns the actual scan start row for a local index scan, or null for any other scan.
// nextRaw() uses it to skip rows whose key sorts before the scan start row, which can
// happen when there are references.
// Called from the actualStartKey field initializer, so it relies on regionInfo having
// been initialized first.
public byte[] getActualStartKey() {
return ScanUtil.isLocalIndex(scan) ? ScanUtil.getActualStartRow(scan, regionInfo)
: null;
// Fetches the next row into results and reports whether more rows remain.
public boolean next(List<Cell> results) throws IOException {
try {
boolean next =;
// A dummy result always reports that more rows remain.
if (ScanUtil.isDummy(results)) {
return true;
return next;
} catch (Throwable t) {
// Every Throwable is handed to ServerUtil.throwIOException together with the region name.
// NOTE(review): presumably throwIOException always throws, making the return below unreachable.
ServerUtil.throwIOException(getRegion().getRegionInfo().getRegionNameAsString(), t);
return false; // impossible
// This overload is not supported by the wrapper: it throws an IOException unconditionally.
public boolean next(List<Cell> result, ScannerContext scannerContext) throws IOException {
throw new IOException("Next with scannerContext should not be called in Phoenix environment");
// NOTE(review): the body is not visible here; presumably it closes the delegate scanner s — confirm.
public void close() throws IOException {
// Delegates to the wrapped scanner s (not to the cached regionInfo field).
public RegionInfo getRegionInfo() {
return s.getRegionInfo();
// Delegates to the wrapped scanner s.
public boolean isFilterDone() throws IOException {
return s.isFilterDone();
// Delegates to the wrapped scanner s, passing the row through unchanged.
public boolean reseek(byte[] row) throws IOException {
return s.reseek(row);
// Delegates to the wrapped scanner s.
public long getMvccReadPoint() {
return s.getMvccReadPoint();
// Reads the next row from the delegate into result and post-processes it: index handling,
// the extra filter, array element replacement, projection and the extra limit.
// Returns whether more rows remain.
public boolean nextRaw(List<Cell> result) throws IOException {
try {
boolean next = s.nextRaw(result);
// A dummy result skips all post-processing and always reports that more rows remain.
if (ScanUtil.isDummy(result)) {
return true;
// Nothing to post-process for an empty row.
if (result.size() == 0) {
return next;
// Index-specific handling; skipped when ScanUtil.isAnalyzeTable(scan) is true.
if ((ScanUtil.isLocalOrUncoveredGlobalIndex(scan))
&& !ScanUtil.isAnalyzeTable(scan)) {
if (ScanUtil.isLocalIndex(scan) && tupleProjector == null) {
// actualStartKey is only set for local index scans; skip rows that sort before it.
if (actualStartKey != null) {
next = scanTillScanStartRow(s, result, null);
if (result.isEmpty() || ScanUtil.isDummy(result)) {
return next;
// NOTE(review): presumably adjusts the cells' row keys using offset — confirm against IndexUtil.
IndexUtil.wrapResultUsingOffset(result, offset);
// Evaluate the extra filter against the row; return early unless it evaluates to TRUE.
if (extraWhere != null) {
Tuple merged = useQualifierAsListIndex ? new PositionBasedResultTuple(result) :
new ResultTuple(Result.create(result));
// Local ptr that shadows the ptr parameter of getWrappedScanner within this scope.
ImmutableBytesWritable ptr = new ImmutableBytesWritable();
extraWhere.evaluate(merged, ptr);
if (!Boolean.TRUE.equals(extraWhere.getDataType().toObject(ptr))) {
return next;
// When array element expressions are present, replaceArrayIndexElement() appends the
// array element cell to result and returns its position.
Cell arrayElementCell = null;
if (arrayFuncRefs != null && arrayFuncRefs.length > 0 && arrayKVRefs.size() > 0) {
int arrayElementCellPosition = replaceArrayIndexElement(arrayKVRefs, arrayFuncRefs, result);
arrayElementCell = result.get(arrayElementCellPosition);
// Project the row and, if the scan asks for it, merge in the dynamic column values.
if (projector != null) {
Tuple toProject = useQualifierAsListIndex ? new PositionBasedResultTuple(result) :
new ResultTuple(Result.create(result));
Pair<Tuple, byte[]> mergedTupleDynColsPair = getTupleWithDynColsIfRequired(result,
projector.projectResults(toProject, useNewValueColumnQualifier));
Tuple tupleWithDynColsIfReqd = mergedTupleDynColsPair.getFirst();
byte[] serializedDynColsList = mergedTupleDynColsPair.getSecond();
if (arrayElementCell != null) {
// The limit is only decremented when it is non-negative; reaching zero returns false.
if (extraLimit >= 0 && --extraLimit == 0) {
return false;
// There is a scanattribute set to retrieve the specific array element
return next;
} catch (Throwable t) {
// Every Throwable is handed to ServerUtil.throwIOException together with the region name.
// NOTE(review): presumably throwIOException always throws, making the return below unreachable.
ServerUtil.throwIOException(getRegion().getRegionInfo().getRegionNameAsString(), t);
return false; // impossible
* Iterate over the list of cells returned from the scan and use the dynamic column metadata
* to create a tuple projector for dynamic columns. Finally, merge this with the projected
* values corresponding to the known columns
* @param result list of cells returned from the scan
* @param tuple projected value tuple from known schema/columns
* @return A pair, whose first part is a combined projected value tuple containing the
* known column values along with resolved dynamic column values and whose second part is
* the serialized list of dynamic column PColumns. In case dynamic columns are not
* to be exposed or are not present, this returns the original tuple and an empty byte array.
* @throws IOException Thrown if there is an error parsing protobuf or merging projected
* values
// Merges dynamic column values into the projected tuple when the scan requests it.
// Otherwise returns the given tuple together with an empty byte array.
private Pair<Tuple, byte[]> getTupleWithDynColsIfRequired(List<Cell> result, Tuple tuple)
throws IOException {
// We only care about dynamic column cells if the scan has this attribute set
if (Bytes.equals(scan.getAttribute(WILDCARD_SCAN_INCLUDES_DYNAMIC_COLUMNS), TRUE_BYTES)) {
// Both lists are passed to getDynamicColumnsTupleProjector() and read afterwards.
List<PColumn> dynCols = new ArrayList<>();
List<Cell> dynColCells = new ArrayList<>();
TupleProjector dynColTupleProj = TupleProjector.getDynamicColumnsTupleProjector(result,
dynCols, dynColCells);
// Only merge when a dynamic column projector was produced.
if (dynColTupleProj != null) {
Tuple toProject = useQualifierAsListIndex ? new PositionBasedResultTuple(dynColCells) :
new ResultTuple(Result.create(dynColCells));
Tuple dynColsProjectedTuple = dynColTupleProj
.projectResults(toProject, useNewValueColumnQualifier);
ValueBitSet destBitSet = projector.getValueBitSet();
// In case we are not projecting any non-row key columns, the field count for the
// current projector will be 0, so we simply use the dynamic column projector's
// value bitset as the destination bitset.
if (projector.getSchema().getFieldCount() == 0) {
destBitSet = dynColTupleProj.getValueBitSet();
// Add dynamic column data at the end of the projected tuple
Tuple mergedTuple = TupleProjector.mergeProjectedValue(
(TupleProjector.ProjectedValueTuple)tuple, destBitSet, dynColsProjectedTuple,
dynColTupleProj.getValueBitSet(), projector.getSchema().getFieldCount(),
// We send the serialized list of PColumns for dynamic columns back to the client
// so that the client can process the corresponding projected values
DynamicColumnMetaDataProtos.DynamicColumnMetaData.Builder dynColsListBuilder =
for (PColumn dynCol : dynCols) {
return new Pair<>(mergedTuple,;
// Dynamic columns were not requested or none were found: hand back the input tuple unchanged.
return new Pair<>(tuple, new byte[0]);
// Runs next(result) and then adds the returned cells to the size progress tracked by
// scannerContext. The context itself is not passed to the underlying scan call.
public boolean nextRaw(List<Cell> result, ScannerContext scannerContext)
throws IOException {
boolean res = next(result);
ScannerContextUtil.incrementSizeProgress(scannerContext, result);
return res;
* When there is a merge in progress while scanning local indexes, we might get key values that sort before the scan start row.
* In that case we need to keep scanning until we get a row key greater than or equal to the scan start key.
* TODO try to fix this case in LocalIndexStoreFileScanner when there is a merge.
// Keeps reading rows from s while the first cell's row key sorts before actualStartKey.
// Returns the value of the last nextRaw() call, or true when a dummy result is handed back.
// Expects result to be non-empty on entry, since it reads result.get(0) unconditionally.
private boolean scanTillScanStartRow(final RegionScanner s,
List<Cell> result,
ScannerContext scannerContext) throws IOException {
boolean next = true;
Cell firstCell = result.get(0);
// Start of the time budget that is compared against pageSizeMs below.
long startTime = EnvironmentEdgeManager.currentTimeMillis();
while (Bytes.compareTo(firstCell.getRowArray(), firstCell.getRowOffset(),
firstCell.getRowLength(), actualStartKey, 0, actualStartKey.length) < 0) {
// Time budget used up: hand back a dummy result built from the current row key.
if (EnvironmentEdgeManager.currentTimeMillis() - startTime >= pageSizeMs) {
byte[] rowKey = CellUtil.cloneRow(result.get(0));
ScanUtil.getDummyResult(rowKey, result);
return true;
// nextRaw(List<Cell>) passes a null scannerContext, so it takes the first branch.
if(scannerContext == null) {
next = s.nextRaw(result);
} else {
next = s.nextRaw(result, scannerContext);
if (result.isEmpty()) {
return next;
// A dummy result from the delegate is passed on and reports that more rows remain.
if (ScanUtil.isDummy(result)) {
return true;
firstCell = result.get(0);
return next;
// Appends to result a cell carrying the serialized array element values and returns
// the position of that cell. Modifies result in place.
private int replaceArrayIndexElement(final Set<KeyValueColumnExpression> arrayKVRefs,
final Expression[] arrayFuncRefs, List<Cell> result) {
// make a copy of the results array here, as we're modifying it below
MultiKeyValueTuple tuple = new MultiKeyValueTuple(ImmutableList.copyOf(result));
// The size of both the arrays would be same?
// Using KeyValueSchema to set and retrieve the value
// collect the first kv to get the row
Cell rowKv = result.get(0);
for (KeyValueColumnExpression kvExp : arrayKVRefs) {
// ptr is the ptr parameter of getWrappedScanner; no local with that name exists here.
if (kvExp.evaluate(tuple, ptr)) {
ListIterator<Cell> itr = result.listIterator();
while (itr.hasNext()) {
Cell kv =;
// Match the cell whose family and qualifier equal those of the expression.
if (Bytes.equals(kvExp.getColumnFamily(), 0, kvExp.getColumnFamily().length,
kv.getFamilyArray(), kv.getFamilyOffset(), kv.getFamilyLength())
&& Bytes.equals(kvExp.getColumnQualifier(), 0, kvExp.getColumnQualifier().length,
kv.getQualifierArray(), kv.getQualifierOffset(), kv.getQualifierLength())) {
// remove the kv that has the full array values.
// Serialize the array element expressions against the copied tuple.
byte[] value = kvSchema.toBytes(tuple, arrayFuncRefs,
kvSchemaBitSet, ptr);
// Add a dummy kv with the exact value of the array index
// The new cell takes its row key and type from rowKv, the first cell of the row.
result.add(new KeyValue(rowKv.getRowArray(), rowKv.getRowOffset(), rowKv.getRowLength(),
KeyValue.Type.codeToType(rowKv.getType().getCode()), value, 0, value.length));
// Position of the cell appended above, i.e. the last index of result.
return getArrayCellPosition(result);
// Delegates to the wrapped scanner s.
public long getMaxResultSize() {
return s.getMaxResultSize();
// Delegates to the wrapped scanner s.
public int getBatch() {
return s.getBatch();
// PHOENIX-4791 Share position of array element cell
// Returns the index of the last cell in result, which is where replaceArrayIndexElement()
// appends the array element cell. For an empty list this evaluates to -1.
public static int getArrayCellPosition(List<Cell> result) {
return result.size() - 1;