blob: df675dfa32956c69b8d46dd5d04ad8e306b4d535 [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.drill.exec.store.delta;
import com.fasterxml.jackson.annotation.JacksonInject;
import com.fasterxml.jackson.annotation.JsonCreator;
import com.fasterxml.jackson.annotation.JsonProperty;
import com.fasterxml.jackson.annotation.JsonTypeName;
import org.apache.drill.common.expression.LogicalExpression;
import org.apache.drill.common.expression.SchemaPath;
import org.apache.drill.common.logical.FormatPluginConfig;
import org.apache.drill.common.logical.StoragePluginConfig;
import org.apache.drill.exec.physical.base.PhysicalOperator;
import org.apache.drill.exec.record.metadata.TupleMetadata;
import org.apache.drill.exec.store.StoragePluginRegistry;
import org.apache.drill.exec.store.delta.format.DeltaFormatPlugin;
import org.apache.drill.exec.store.delta.format.DeltaFormatPluginConfig;
import org.apache.drill.exec.store.parquet.AbstractParquetRowGroupScan;
import org.apache.drill.exec.store.parquet.ParquetReaderConfig;
import org.apache.drill.exec.store.parquet.RowGroupReadEntry;
import org.apache.drill.shaded.guava.com.google.common.base.Preconditions;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.Path;
import java.util.Collections;
import java.util.List;
import java.util.Map;
@JsonTypeName("delta-row-group-scan")
public class DeltaRowGroupScan extends AbstractParquetRowGroupScan {
public static final String OPERATOR_TYPE = "DELTA_ROW_GROUP_SCAN";
private final DeltaFormatPlugin formatPlugin;
private final DeltaFormatPluginConfig formatPluginConfig;
private final Map<Path, Map<String, String>> partitions;
@JsonCreator
public DeltaRowGroupScan(@JacksonInject StoragePluginRegistry registry,
@JsonProperty("userName") String userName,
@JsonProperty("storageConfig") StoragePluginConfig storageConfig,
@JsonProperty("formatPluginConfig") FormatPluginConfig formatPluginConfig,
@JsonProperty("rowGroupReadEntries") List<RowGroupReadEntry> rowGroupReadEntries,
@JsonProperty("columns") List<SchemaPath> columns,
@JsonProperty("partitions") Map<Path, Map<String, String>> partitions,
@JsonProperty("readerConfig") ParquetReaderConfig readerConfig,
@JsonProperty("filter") LogicalExpression filter,
@JsonProperty("schema") TupleMetadata schema) {
this(userName,
registry.resolveFormat(storageConfig, formatPluginConfig, DeltaFormatPlugin.class),
rowGroupReadEntries,
columns,
partitions,
readerConfig,
filter,
schema);
}
public DeltaRowGroupScan(String userName,
DeltaFormatPlugin formatPlugin,
List<RowGroupReadEntry> rowGroupReadEntries,
List<SchemaPath> columns,
Map<Path, Map<String, String>> partitions,
ParquetReaderConfig readerConfig,
LogicalExpression filter,
TupleMetadata schema) {
super(userName, rowGroupReadEntries, columns, readerConfig, filter,null, schema);
this.formatPlugin = formatPlugin;
this.formatPluginConfig = formatPlugin.getConfig();
this.partitions = partitions;
}
@JsonProperty
public StoragePluginConfig getStorageConfig() {
return formatPlugin.getStorageConfig();
}
@JsonProperty
public DeltaFormatPluginConfig getFormatPluginConfig() {
return formatPluginConfig;
}
@JsonProperty
public Map<Path, Map<String, String>> getPartitions() {
return partitions;
}
@Override
public PhysicalOperator getNewWithChildren(List<PhysicalOperator> children) {
Preconditions.checkArgument(children.isEmpty());
return new DeltaRowGroupScan(getUserName(), formatPlugin, rowGroupReadEntries, columns, partitions,
readerConfig, filter, schema);
}
@Override
public String getOperatorType() {
return OPERATOR_TYPE;
}
@Override
public AbstractParquetRowGroupScan copy(List<SchemaPath> columns) {
return new DeltaRowGroupScan(getUserName(), formatPlugin, rowGroupReadEntries, columns, partitions,
readerConfig, filter, schema);
}
@Override
public Configuration getFsConf(RowGroupReadEntry rowGroupReadEntry) {
return formatPlugin.getFsConf();
}
@Override
public boolean supportsFileImplicitColumns() {
return true;
}
@Override
public List<String> getPartitionValues(RowGroupReadEntry rowGroupReadEntry) {
return Collections.emptyList();
}
public Map<String, String> getPartitions(RowGroupReadEntry rowGroupReadEntry) {
return partitions.get(rowGroupReadEntry.getPath());
}
@Override
public boolean isImplicitColumn(SchemaPath path, String partitionColumnLabel) {
return partitions.values().stream()
.anyMatch(map -> map.containsKey(path.getAsUnescapedPath()));
}
}