| /* |
| * Licensed to the Apache Software Foundation (ASF) under one |
| * or more contributor license agreements. See the NOTICE file |
| * distributed with this work for additional information |
| * regarding copyright ownership. The ASF licenses this file |
| * to you under the Apache License, Version 2.0 (the |
| * "License"); you may not use this file except in compliance |
| * with the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, |
| * software distributed under the License is distributed on an |
| * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
| * KIND, either express or implied. See the License for the |
| * specific language governing permissions and limitations |
| * under the License. |
| */ |
| |
| package org.apache.hyracks.algebricks.core.algebra.operators.physical; |
| |
| import java.util.ArrayList; |
| import java.util.List; |
| |
| import org.apache.hyracks.algebricks.common.constraints.AlgebricksPartitionConstraint; |
| import org.apache.hyracks.algebricks.common.exceptions.AlgebricksException; |
| import org.apache.hyracks.algebricks.common.utils.Pair; |
| import org.apache.hyracks.algebricks.core.algebra.base.IHyracksJobBuilder; |
| import org.apache.hyracks.algebricks.core.algebra.base.ILogicalOperator; |
| import org.apache.hyracks.algebricks.core.algebra.base.IOptimizationContext; |
| import org.apache.hyracks.algebricks.core.algebra.base.LogicalVariable; |
| import org.apache.hyracks.algebricks.core.algebra.base.PhysicalOperatorTag; |
| import org.apache.hyracks.algebricks.core.algebra.expressions.IVariableTypeEnvironment; |
| import org.apache.hyracks.algebricks.core.algebra.metadata.IDataSourceIndex; |
| import org.apache.hyracks.algebricks.core.algebra.metadata.IMetadataProvider; |
| import org.apache.hyracks.algebricks.core.algebra.operators.logical.AbstractLogicalOperator; |
| import org.apache.hyracks.algebricks.core.algebra.operators.logical.IOperatorSchema; |
| import org.apache.hyracks.algebricks.core.algebra.operators.logical.InsertDeleteOperator.Kind; |
| import org.apache.hyracks.algebricks.core.algebra.operators.logical.TokenizeOperator; |
| import org.apache.hyracks.algebricks.core.algebra.properties.IPhysicalPropertiesVector; |
| import org.apache.hyracks.algebricks.core.algebra.properties.PhysicalRequirements; |
| import org.apache.hyracks.algebricks.core.algebra.properties.StructuralPropertiesVector; |
| import org.apache.hyracks.algebricks.core.jobgen.impl.JobGenContext; |
| import org.apache.hyracks.algebricks.core.jobgen.impl.JobGenHelper; |
| import org.apache.hyracks.api.dataflow.IOperatorDescriptor; |
| import org.apache.hyracks.api.dataflow.value.RecordDescriptor; |
| import org.apache.hyracks.api.job.JobSpecification; |
| |
| public class TokenizePOperator extends AbstractPhysicalOperator { |
| |
| private final List<LogicalVariable> primaryKeys; |
| private final List<LogicalVariable> secondaryKeys; |
| private final IDataSourceIndex<?, ?> dataSourceIndex; |
| |
| public TokenizePOperator(List<LogicalVariable> primaryKeys, List<LogicalVariable> secondaryKeys, |
| IDataSourceIndex<?, ?> dataSourceIndex) { |
| this.primaryKeys = primaryKeys; |
| this.secondaryKeys = secondaryKeys; |
| this.dataSourceIndex = dataSourceIndex; |
| } |
| |
| @Override |
| public PhysicalOperatorTag getOperatorTag() { |
| return PhysicalOperatorTag.TOKENIZE; |
| } |
| |
| @Override |
| public PhysicalRequirements getRequiredPropertiesForChildren(ILogicalOperator op, |
| IPhysicalPropertiesVector reqdByParent) { |
| return emptyUnaryRequirements(); |
| } |
| |
| @Override |
| public void computeDeliveredProperties(ILogicalOperator op, IOptimizationContext context) |
| throws AlgebricksException { |
| AbstractLogicalOperator op2 = (AbstractLogicalOperator) op.getInputs().get(0).getValue(); |
| deliveredProperties = (StructuralPropertiesVector) op2.getDeliveredPhysicalProperties().clone(); |
| } |
| |
| @Override |
| public void contributeRuntimeOperator(IHyracksJobBuilder builder, JobGenContext context, ILogicalOperator op, |
| IOperatorSchema propagatedSchema, IOperatorSchema[] inputSchemas, IOperatorSchema outerPlanSchema) |
| throws AlgebricksException { |
| TokenizeOperator tokenizeOp = (TokenizeOperator) op; |
| if (tokenizeOp.getOperation() != Kind.INSERT || !tokenizeOp.isBulkload()) { |
| throw new AlgebricksException("Tokenize Operator only works when bulk-loading data."); |
| } |
| |
| IMetadataProvider mp = context.getMetadataProvider(); |
| IVariableTypeEnvironment typeEnv = context.getTypeEnvironment(op); |
| JobSpecification spec = builder.getJobSpec(); |
| RecordDescriptor inputDesc = JobGenHelper.mkRecordDescriptor( |
| context.getTypeEnvironment(op.getInputs().get(0).getValue()), inputSchemas[0], context); |
| Pair<IOperatorDescriptor, AlgebricksPartitionConstraint> runtimeAndConstraints = mp.getTokenizerRuntime( |
| dataSourceIndex, propagatedSchema, inputSchemas, typeEnv, primaryKeys, secondaryKeys, null, inputDesc, |
| context, spec, true); |
| builder.contributeHyracksOperator(tokenizeOp, runtimeAndConstraints.first); |
| builder.contributeAlgebricksPartitionConstraint(runtimeAndConstraints.first, runtimeAndConstraints.second); |
| ILogicalOperator src = tokenizeOp.getInputs().get(0).getValue(); |
| builder.contributeGraphEdge(src, 0, tokenizeOp, 0); |
| } |
| |
| @Override |
| public boolean isMicroOperator() { |
| return false; |
| } |
| |
| @Override |
| public boolean expensiveThanMaterialization() { |
| return false; |
| } |
| } |