blob: 1c13773ac8867257b35141ebdb9545f93a0f5ee1 [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.drill.exec.planner.logical;
import java.util.ArrayList;
import java.util.List;
import org.apache.calcite.rel.RelWriter;
import org.apache.calcite.rel.metadata.RelMetadataQuery;
import org.apache.drill.common.JSONOptions;
import org.apache.drill.common.expression.SchemaPath;
import org.apache.drill.common.logical.data.LogicalOperator;
import org.apache.drill.common.logical.data.Scan;
import org.apache.drill.exec.physical.base.GroupScan;
import org.apache.drill.exec.physical.base.ScanStats;
import org.apache.drill.exec.planner.common.DrillScanRelBase;
import org.apache.drill.exec.planner.physical.PlannerSettings;
import org.apache.drill.exec.planner.physical.PrelUtil;
import org.apache.drill.exec.planner.torel.ConversionContext;
import org.apache.calcite.plan.RelOptCluster;
import org.apache.calcite.plan.RelOptCost;
import org.apache.calcite.plan.RelOptPlanner;
import org.apache.calcite.plan.RelOptTable;
import org.apache.calcite.plan.RelTraitSet;
import org.apache.calcite.rel.type.RelDataType;
import com.google.common.base.Preconditions;
import org.apache.drill.exec.util.Utilities;
/**
 * Scan of a Drill table in the logical planning package, backed by a
 * {@link GroupScan}.
 *
 * <p>The node carries the projected columns, the row type it reports to the
 * planner and a flag recording whether partition filter push-down applies.
 * Row-count and cost estimates are derived from the group scan's
 * {@link ScanStats}.
 */
public class DrillScanRel extends DrillScanRelBase implements DrillRel {

  /** Column count assumed by {@link #computeSelfCost} when the projection is a star query. */
  public static final int STAR_COLUMN_COST = 10_000;

  /** Planner settings resolved once from the cluster's planner; handed to the group scan for stats. */
  private final PlannerSettings settings;
  private final List<SchemaPath> columns;
  private final boolean partitionFilterPushdown;
  private final RelDataType rowType;

  /**
   * Creates a scan over every column of {@code table}, without partition
   * filter push-down.
   *
   * @param cluster cluster this node belongs to
   * @param traits  trait set of the node
   * @param table   table being scanned
   */
  public DrillScanRel(final RelOptCluster cluster, final RelTraitSet traits,
      final RelOptTable table) {
    this(cluster, traits, table, false);
  }

  /**
   * Creates a scan over every column of {@code table}; the row type and the
   * projected columns are both taken from the table's row type.
   *
   * @param cluster                 cluster this node belongs to
   * @param traits                  trait set of the node
   * @param table                   table being scanned
   * @param partitionFilterPushdown value later reported by {@link #partitionFilterPushdown()}
   */
  public DrillScanRel(final RelOptCluster cluster, final RelTraitSet traits,
      final RelOptTable table, boolean partitionFilterPushdown) {
    // The delegated constructor already initialises the planner settings.
    this(cluster, traits, table, table.getRowType(), getProjectedColumns(table, false), partitionFilterPushdown);
  }

  /**
   * Creates a scan with an explicit row type and column list, without
   * partition filter push-down.
   *
   * @param cluster cluster this node belongs to
   * @param traits  trait set of the node
   * @param table   table being scanned
   * @param rowType row type returned by {@link #deriveRowType()}
   * @param columns projected columns; must not be {@code null}
   */
  public DrillScanRel(final RelOptCluster cluster, final RelTraitSet traits,
      final RelOptTable table, final RelDataType rowType, final List<SchemaPath> columns) {
    this(cluster, traits, table, rowType, columns, false);
  }

  /**
   * Creates a scan with an explicit row type and column list. The table and
   * the columns are handed to the base class constructor.
   *
   * @param cluster                 cluster this node belongs to
   * @param traits                  trait set of the node
   * @param table                   table being scanned
   * @param rowType                 row type returned by {@link #deriveRowType()}
   * @param columns                 projected columns; must not be {@code null}
   * @param partitionFilterPushdown value later reported by {@link #partitionFilterPushdown()}
   * @throws NullPointerException if {@code columns} is {@code null}
   */
  public DrillScanRel(final RelOptCluster cluster, final RelTraitSet traits,
      final RelOptTable table, final RelDataType rowType, final List<SchemaPath> columns,
      boolean partitionFilterPushdown) {
    super(cluster, traits, table, columns);
    this.settings = PrelUtil.getPlannerSettings(cluster.getPlanner());
    this.rowType = rowType;
    Preconditions.checkNotNull(columns);
    this.columns = columns;
    this.partitionFilterPushdown = partitionFilterPushdown;
  }

  /**
   * Creates a DrillScanRel for a particular GroupScan, without partition
   * filter push-down.
   *
   * @param cluster   cluster this node belongs to
   * @param traits    trait set of the node
   * @param table     table being scanned
   * @param groupScan group scan backing this node
   * @param rowType   row type returned by {@link #deriveRowType()}
   * @param columns   projected columns
   */
  public DrillScanRel(final RelOptCluster cluster, final RelTraitSet traits,
      final RelOptTable table, final GroupScan groupScan, final RelDataType rowType,
      final List<SchemaPath> columns) {
    this(cluster, traits, table, groupScan, rowType, columns, false);
  }

  /**
   * Creates a DrillScanRel for a particular GroupScan.
   *
   * @param cluster                 cluster this node belongs to
   * @param traits                  trait set of the node
   * @param table                   table being scanned
   * @param groupScan               group scan backing this node
   * @param rowType                 row type returned by {@link #deriveRowType()}
   * @param columns                 projected columns
   * @param partitionFilterPushdown value later reported by {@link #partitionFilterPushdown()}
   */
  public DrillScanRel(final RelOptCluster cluster, final RelTraitSet traits,
      final RelOptTable table, final GroupScan groupScan, final RelDataType rowType,
      final List<SchemaPath> columns, boolean partitionFilterPushdown) {
    super(cluster, traits, groupScan, table);
    this.rowType = rowType;
    this.columns = columns;
    this.settings = PrelUtil.getPlannerSettings(cluster.getPlanner());
    this.partitionFilterPushdown = partitionFilterPushdown;
  }

  /**
   * @return the projected columns supplied at construction time (the same
   *         list instance, not a copy)
   */
  public List<SchemaPath> getColumns() {
    return this.columns;
  }

  /**
   * Builds the logical {@link Scan} operator for this node from the table's
   * storage engine name and selection, and registers the table as a source
   * with the implementor.
   *
   * @param implementor implementor collecting the sources of the plan
   * @return the built scan operator
   */
  @Override
  public LogicalOperator implement(DrillImplementor implementor) {
    Scan.Builder builder = Scan.builder();
    builder.storageEngine(drillTable.getStorageEngineName());
    builder.selection(new JSONOptions(drillTable.getSelection()));
    implementor.registerSource(drillTable);
    return builder.build();
  }

  /**
   * Creates a scan rel for a logical {@link Scan} operator, using the
   * cluster, logical traits and table provided by the conversion context.
   *
   * @param scan    logical scan operator to convert
   * @param context conversion context supplying cluster, traits and table
   * @return a new scan rel over all columns of the resolved table
   */
  public static DrillScanRel convert(Scan scan, ConversionContext context) {
    return new DrillScanRel(context.getCluster(), context.getLogicalTraits(),
        context.getTable(scan));
  }

  /** @return the row type supplied at construction time */
  @Override
  public RelDataType deriveRowType() {
    return this.rowType;
  }

  /** Adds the group scan's digest to the explain output under the key {@code groupscan}. */
  @Override
  public RelWriter explainTerms(RelWriter pw) {
    return super.explainTerms(pw).item("groupscan", getGroupScan().getDigest());
  }

  /** @return the record count reported by the group scan's statistics */
  @Override
  public double estimateRowCount(RelMetadataQuery mq) {
    return getGroupScan().getScanStats(settings).getRecordCount();
  }

  // TODO: this method is same as the one for ScanPrel...eventually we should consolidate
  // this and few other methods in a common base class which would be extended
  // by both logical and physical rels.
  // TODO: Further changes may have caused the versions to diverge.
  // TODO: Does not compute IO cost by default, but should. Changing that may break
  // existing plugins.
  /**
   * Computes the cost of this scan from the group scan's statistics.
   *
   * <p>The effective column count is {@link #STAR_COLUMN_COST} for a star
   * query; otherwise it is the square of the row type's field count divided
   * by the number of projected columns (at least 1). The row count is the
   * reported record count, floored at 1.
   *
   * @param planner planner whose cost factory creates the result
   * @param mq      metadata query (not used by this implementation)
   * @return the estimated cost of the scan
   */
  @Override
  public RelOptCost computeSelfCost(final RelOptPlanner planner, RelMetadataQuery mq) {
    final ScanStats stats = getGroupScan().getScanStats(settings);
    double columnCount = Utilities.isStarQuery(columns)
        ? STAR_COLUMN_COST
        : Math.pow(getRowType().getFieldCount(), 2) / Math.max(columns.size(), 1);

    double rowCount = Math.max(1, stats.getRecordCount());
    double valueCount = rowCount * columnCount;

    if (PrelUtil.getSettings(getCluster()).useDefaultCosting()) {
      // TODO: makeCost() wants a row count, but we provide a value count.
      // Likely a bug, but too risky to change as it may affect existing plugins.
      // If we do make the fix, then the default costing path is the same as the
      // full cost path.
      // TODO: At this late date, with many plugins exploiting (if only by
      // accident) the default costing here, it is not clear if we even want
      // the planner to control the cost model. That is, remove this path.
      return planner.getCostFactory().makeCost(valueCount, stats.getCpuCost(), stats.getDiskCost());
    }

    double cpuCost;
    double ioCost;
    if (stats.getGroupScanProperty().hasFullCost()) {
      // The group scan supplies its own CPU and disk costs; use them as-is.
      cpuCost = stats.getCpuCost();
      ioCost = stats.getDiskCost();
    } else {
      // for now, assume cpu cost is proportional to row count and number of columns
      cpuCost = valueCount;
      // TODO: the default IO cost should arguably be proportional to valueCount;
      // it is left at 0 because changing it may break existing plugins.
      ioCost = 0;
    }
    return planner.getCostFactory().makeCost(rowCount, cpuCost, ioCost);
  }

  /** @return the partition filter push-down flag supplied at construction time */
  public boolean partitionFilterPushdown() {
    return this.partitionFilterPushdown;
  }

  /**
   * Builds the projected column list from the field names of the table's
   * row type, one simple path per field.
   *
   * @param table        table whose row type supplies the field names
   * @param isSelectStar whether the query is a {@code SELECT *}; when true and
   *                     the resulting list is not already a star query, the
   *                     star column is appended
   * @return a new mutable list of projected columns
   */
  public static List<SchemaPath> getProjectedColumns(final RelOptTable table, boolean isSelectStar) {
    List<String> columnNames = table.getRowType().getFieldNames();
    List<SchemaPath> projectedColumns = new ArrayList<>(columnNames.size());

    for (String columnName : columnNames) {
      projectedColumns.add(SchemaPath.getSimplePath(columnName));
    }

    // If the row-type doesn't contain the STAR keyword, then insert it
    // as we are dealing with a SELECT_STAR query.
    if (isSelectStar && !Utilities.isStarQuery(projectedColumns)) {
      projectedColumns.add(SchemaPath.STAR_COLUMN);
    }

    return projectedColumns;
  }

  /**
   * Creates a copy of this node with the given trait set, group scan and row
   * type; cluster, table, columns and the partition filter push-down flag are
   * carried over from this node.
   *
   * @param traitSet trait set of the copy
   * @param scan     group scan backing the copy
   * @param rowType  row type of the copy
   * @return the new scan rel
   */
  @Override
  public DrillScanRel copy(RelTraitSet traitSet, GroupScan scan, RelDataType rowType) {
    // Honour the requested trait set rather than silently reusing this node's own.
    return new DrillScanRel(getCluster(), traitSet, getTable(), scan, rowType, getColumns(), partitionFilterPushdown());
  }
}