/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/

package org.apache.drill.exec.store.delta.format;

import org.apache.calcite.plan.Convention;
import org.apache.calcite.plan.RelOptRule;
import org.apache.drill.common.expression.SchemaPath;
import org.apache.drill.exec.metastore.MetadataProviderManager;
import org.apache.drill.exec.physical.base.AbstractGroupScan;
import org.apache.drill.exec.physical.base.AbstractWriter;
import org.apache.drill.exec.physical.base.PhysicalOperator;
import org.apache.drill.exec.planner.PlannerPhase;
import org.apache.drill.exec.planner.common.DrillStatsTable;
import org.apache.drill.exec.record.metadata.TupleMetadata;
import org.apache.drill.exec.record.metadata.schema.SchemaProvider;
import org.apache.drill.exec.server.DrillbitContext;
import org.apache.drill.exec.server.options.OptionManager;
import org.apache.drill.exec.store.PluginRulesProviderImpl;
import org.apache.drill.exec.store.StoragePluginRulesSupplier;
import org.apache.drill.exec.store.dfs.FileSelection;
import org.apache.drill.exec.store.dfs.FileSystemConfig;
import org.apache.drill.exec.store.dfs.FormatMatcher;
import org.apache.drill.exec.store.dfs.FormatPlugin;
import org.apache.drill.exec.store.delta.DeltaGroupScan;
import org.apache.drill.exec.store.delta.plan.DeltaPluginImplementor;
import org.apache.drill.exec.store.parquet.ParquetReaderConfig;
import org.apache.drill.exec.store.plan.rel.PluginRel;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;
import java.io.IOException;
import java.util.Collections;
import java.util.List;
import java.util.Set;
import java.util.concurrent.atomic.AtomicInteger;
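
/**
 * Format plugin for reading Delta Lake tables. The plugin is read-only:
 * {@link #supportsWrite()} returns {@code false} and {@link #getWriter} throws
 * {@link UnsupportedOperationException}. Scans are created as {@link DeltaGroupScan}
 * instances backed by a {@link ParquetReaderConfig}, and planner rules with filter,
 * project and limit pushdown support are registered under a plugin-specific convention.
 *
 * <p>Illustrative usage, assuming a {@code dfs} storage plugin whose configuration
 * enables this format (the storage plugin name and table path below are assumptions,
 * not part of this class):
 * <pre>{@code
 * SELECT * FROM dfs.`/path/to/delta-table`;
 * }</pre>
 */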
public class DeltaFormatPlugin implements FormatPlugin {
private static final String DELTA_CONVENTION_PREFIX = "DELTA.";
/**
 * Generator for format id values. Formats with the same name may be defined
 * in multiple storage plugins, so a unique id is appended to the convention
 * name to ensure that rule names are unique across plugin instances.
 */
private static final AtomicInteger NEXT_ID = new AtomicInteger(0);
private final FileSystemConfig storageConfig;
private final DeltaFormatPluginConfig config;
private final Configuration fsConf;
private final DrillbitContext context;
private final String name;
private final DeltaFormatMatcher matcher;
private final StoragePluginRulesSupplier storagePluginRulesSupplier;
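/**
 * Creates the format plugin instance and builds its planner rules supplier.
 * A unique id is appended to the plugin name so that rule names created for
 * this instance do not clash with those of other instances of the same format.
 */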
public DeltaFormatPlugin(
String name,
DrillbitContext context,
Configuration fsConf,
FileSystemConfig storageConfig,
DeltaFormatPluginConfig config) {
this.storageConfig = storageConfig;
this.config = config;
this.fsConf = fsConf;
this.context = context;
this.name = name;
this.matcher = new DeltaFormatMatcher(this);
this.storagePluginRulesSupplier = storagePluginRulesSupplier(name + NEXT_ID.getAndIncrement());
}
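/**
 * Builds the rules supplier for this plugin instance: a dedicated Calcite
 * convention prefixed with {@code DELTA.} is created over {@link PluginRel},
 * and filter, project and limit pushdown are enabled via {@link DeltaPluginImplementor}.
 */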
private static StoragePluginRulesSupplier storagePluginRulesSupplier(String name) {
Convention convention = new Convention.Impl(DELTA_CONVENTION_PREFIX + name, PluginRel.class);
return StoragePluginRulesSupplier.builder()
.rulesProvider(new PluginRulesProviderImpl(convention, DeltaPluginImplementor::new))
.supportsFilterPushdown(true)
.supportsProjectPushdown(true)
.supportsLimitPushdown(true)
.convention(convention)
.build();
}
@Override
public boolean supportsRead() {
return true;
}
@Override
public boolean supportsWrite() {
return false;
}
@Override
public boolean supportsAutoPartitioning() {
return false;
}
@Override
public FormatMatcher getMatcher() {
return matcher;
}
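/**
 * Writing Delta tables is not supported, see {@link #supportsWrite()}.
 */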
@Override
public AbstractWriter getWriter(PhysicalOperator child, String location, List<String> partitionColumns) {
throw new UnsupportedOperationException();
}
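/**
 * Returns the pushdown rules for the logical and physical planning phases;
 * every other phase gets an empty set.
 */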
@Override
public Set<? extends RelOptRule> getOptimizerRules(PlannerPhase phase) {
switch (phase) {
case PHYSICAL:
case LOGICAL:
return storagePluginRulesSupplier.getOptimizerRules();
case LOGICAL_PRUNE_AND_JOIN:
case LOGICAL_PRUNE:
case PARTITION_PRUNING:
case JOIN_PLANNING:
default:
return Collections.emptySet();
}
}
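/**
 * Delegates to {@link #getGroupScan(String, FileSelection, List, OptionManager)}
 * with no session options.
 */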
@Override
public AbstractGroupScan getGroupScan(String userName, FileSelection selection, List<SchemaPath> columns) throws IOException {
return getGroupScan(userName, selection, columns, (OptionManager) null);
}
@Override
public AbstractGroupScan getGroupScan(String userName, FileSelection selection, List<SchemaPath> columns, OptionManager options) throws IOException {
return getGroupScan(userName, selection, columns, options, null);
}
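/**
 * Creates a {@link DeltaGroupScan} for the selection root. The Parquet reader
 * configuration is derived from the file system configuration and, when present,
 * the session options. No limit is applied at this point, and the metadata
 * provider manager is not used by this overload.
 */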
@Override
public AbstractGroupScan getGroupScan(String userName, FileSelection selection,
List<SchemaPath> columns, OptionManager options, MetadataProviderManager metadataProviderManager) throws IOException {
ParquetReaderConfig readerConfig = ParquetReaderConfig.builder()
.withConf(fsConf)
.withOptions(options)
.build();
return DeltaGroupScan.builder()
.userName(userName)
.formatPlugin(this)
.readerConfig(readerConfig)
.path(selection.selectionRoot.toUri().getPath())
.columns(columns)
.limit(-1)
.build();
}
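/**
 * Creates a {@link DeltaGroupScan} that also carries the provided schema, read
 * from the manager's {@link SchemaProvider} when one is registered.
 */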
@Override
public AbstractGroupScan getGroupScan(String userName, FileSelection selection,
List<SchemaPath> columns, MetadataProviderManager metadataProviderManager) throws IOException {
SchemaProvider schemaProvider = metadataProviderManager.getSchemaProvider();
TupleMetadata schema = schemaProvider != null
? schemaProvider.read().getSchema()
: null;
return DeltaGroupScan.builder()
.userName(userName)
.formatPlugin(this)
.readerConfig(ParquetReaderConfig.builder().withConf(fsConf).build())
.schema(schema)
.path(selection.selectionRoot.toUri().getPath())
.columns(columns)
.limit(-1)
.build();
}
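/**
 * Table statistics are not supported: {@link #readStatistics} and
 * {@link #writeStatistics} throw {@link UnsupportedOperationException}.
 */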
@Override
public boolean supportsStatistics() {
return false;
}
@Override
public DrillStatsTable.TableStatistics readStatistics(FileSystem fs, Path statsTablePath) {
throw new UnsupportedOperationException("unimplemented");
}
@Override
public void writeStatistics(DrillStatsTable.TableStatistics statistics, FileSystem fs, Path statsTablePath) {
throw new UnsupportedOperationException("unimplemented");
}
@Override
public DeltaFormatPluginConfig getConfig() {
return config;
}
@Override
public FileSystemConfig getStorageConfig() {
return storageConfig;
}
@Override
public Configuration getFsConf() {
return fsConf;
}
@Override
public DrillbitContext getContext() {
return context;
}
@Override
public String getName() {
return name;
}
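/**
 * Returns the Calcite convention under which this plugin's pushdown rules
 * are registered.
 */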
public Convention getConvention() {
return storagePluginRulesSupplier.convention();
}
}