blob: 7ea06140c24b47218fac69fc15003791493fe464 [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.vxquery.compiler.rewriter.rules;
import java.util.ArrayList;
import java.util.List;
import org.apache.commons.lang3.mutable.Mutable;
import org.apache.commons.lang3.mutable.MutableObject;
import org.apache.vxquery.compiler.rewriter.rules.util.ExpressionToolbox;
import org.apache.vxquery.functions.BuiltinOperators;
import org.apache.hyracks.algebricks.common.exceptions.AlgebricksException;
import org.apache.hyracks.algebricks.core.algebra.base.ILogicalExpression;
import org.apache.hyracks.algebricks.core.algebra.base.ILogicalOperator;
import org.apache.hyracks.algebricks.core.algebra.base.IOptimizationContext;
import org.apache.hyracks.algebricks.core.algebra.base.LogicalExpressionTag;
import org.apache.hyracks.algebricks.core.algebra.base.LogicalOperatorTag;
import org.apache.hyracks.algebricks.core.algebra.base.LogicalVariable;
import org.apache.hyracks.algebricks.core.algebra.expressions.AbstractFunctionCallExpression;
import org.apache.hyracks.algebricks.core.algebra.expressions.AggregateFunctionCallExpression;
import org.apache.hyracks.algebricks.core.algebra.expressions.UnnestingFunctionCallExpression;
import org.apache.hyracks.algebricks.core.algebra.expressions.VariableReferenceExpression;
import org.apache.hyracks.algebricks.core.algebra.functions.IFunctionInfo;
import org.apache.hyracks.algebricks.core.algebra.operators.logical.AbstractLogicalOperator;
import org.apache.hyracks.algebricks.core.algebra.operators.logical.AggregateOperator;
import org.apache.hyracks.algebricks.core.algebra.operators.logical.AssignOperator;
import org.apache.hyracks.algebricks.core.algebra.operators.logical.NestedTupleSourceOperator;
import org.apache.hyracks.algebricks.core.algebra.operators.logical.SubplanOperator;
import org.apache.hyracks.algebricks.core.algebra.operators.logical.UnnestOperator;
/**
* The rule searches for assign operators that have a xquery aggregate function.
* The aggregate function will be more efficient when used by an aggregate
* operator.
* XQuery aggregate functions are implemented in both scalar (one XDM Instance
* input as a sequence) and iterative (a stream of XDM Instances each one is
* single object).
*
* <pre>
* Before
*
* plan__parent
* ASSIGN( $v2 : sf1( $v0 ) )
* plan__child
*
* Where sf1 is a XQuery aggregate function expression (count, max, min,
* average, sum) with any supporting functions like treat, promote or data.
* The variable $v0 is defined in plan__child.
*
* After
*
* plan__parent
* SUBPLAN{
* AGGREGATE( $v2 : af1( $v1 ) )
* UNNEST( $v1 : iterate( $v0 ) )
* NESTEDTUPLESOURCE
* }
* plan__child
* </pre>
*
* @author prestonc
*/
public class ConvertAssignToAggregateRule extends AbstractVXQueryAggregateRule {
/**
* Find where an assign for a aggregate function is used before aggregate operator for a sequence.
* Search pattern 1: assign [function-call: count(function-call: treat($$))]
* Search pattern 2: $$ for aggregate [function-call: sequence()]
*/
@Override
public boolean rewritePre(Mutable<ILogicalOperator> opRef, IOptimizationContext context) throws AlgebricksException {
IFunctionInfo aggregateInfo;
AbstractFunctionCallExpression finalFunctionCall;
Mutable<ILogicalOperator> nextOperatorRef;
// Check if assign is for aggregate function.
AbstractLogicalOperator op = (AbstractLogicalOperator) opRef.getValue();
if (op.getOperatorTag() != LogicalOperatorTag.ASSIGN) {
return false;
}
AssignOperator assign = (AssignOperator) op;
Mutable<ILogicalExpression> mutableLogicalExpression = assign.getExpressions().get(0);
ILogicalExpression logicalExpression = mutableLogicalExpression.getValue();
if (logicalExpression.getExpressionTag() != LogicalExpressionTag.FUNCTION_CALL) {
return false;
}
AbstractFunctionCallExpression functionCall = (AbstractFunctionCallExpression) logicalExpression;
// TODO get the function through the function definition
aggregateInfo = getAggregateFunction(functionCall);
if (aggregateInfo == null) {
return false;
}
Mutable<ILogicalExpression> mutableVariableExpresion = ExpressionToolbox.findVariableExpression(mutableLogicalExpression);
if (mutableVariableExpresion == null) {
return false;
}
Mutable<ILogicalExpression> finalFunctionCallM = ExpressionToolbox
.findLastFunctionExpression(mutableLogicalExpression);
finalFunctionCall = (AbstractFunctionCallExpression) finalFunctionCallM.getValue();
// Build a subplan for replacing the sort distinct function with operators.
// Nested tuple source.
Mutable<ILogicalOperator> inputOperator = getInputOperator(assign.getInputs().get(0));
NestedTupleSourceOperator ntsOperator = new NestedTupleSourceOperator(inputOperator);
nextOperatorRef = new MutableObject<ILogicalOperator>(ntsOperator);
// Get variable that is being used for sort and distinct operators.
VariableReferenceExpression inputVariableRef = (VariableReferenceExpression) mutableVariableExpresion.getValue();
LogicalVariable inputVariable = inputVariableRef.getVariableReference();
// Unnest.
LogicalVariable unnestVariable = context.newVar();
UnnestOperator unnestOperator = getUnnestOperator(inputVariable, unnestVariable);
unnestOperator.getInputs().add(nextOperatorRef);
nextOperatorRef = new MutableObject<ILogicalOperator>(unnestOperator);
// Aggregate.
VariableReferenceExpression inputArg = new VariableReferenceExpression(unnestVariable);
finalFunctionCall.getArguments().get(0).setValue(inputArg);
Mutable<ILogicalExpression> aggregateArgs = functionCall.getArguments().get(0);
LogicalVariable aggregateVariable = assign.getVariables().get(0);
AggregateOperator aggregateOperator = getAggregateOperator(aggregateInfo, aggregateArgs, aggregateVariable);
aggregateOperator.getInputs().add(nextOperatorRef);
nextOperatorRef = new MutableObject<ILogicalOperator>(aggregateOperator);
// Subplan.
SubplanOperator subplanOperator = new SubplanOperator();
subplanOperator.getInputs().add(assign.getInputs().get(0));
subplanOperator.setRootOp(nextOperatorRef);
opRef.setValue(subplanOperator);
return true;
}
@Override
public boolean rewritePost(Mutable<ILogicalOperator> opRef, IOptimizationContext context) {
return false;
}
private AggregateOperator getAggregateOperator(IFunctionInfo aggregateFunction,
Mutable<ILogicalExpression> aggregateArgs, LogicalVariable aggregateVariable) {
List<LogicalVariable> aggregateVariables = new ArrayList<LogicalVariable>();
aggregateVariables.add(aggregateVariable);
List<Mutable<ILogicalExpression>> aggregateSequenceArgs = new ArrayList<Mutable<ILogicalExpression>>();
aggregateSequenceArgs.add(aggregateArgs);
List<Mutable<ILogicalExpression>> exprs = new ArrayList<Mutable<ILogicalExpression>>();
ILogicalExpression aggregateExp = new AggregateFunctionCallExpression(aggregateFunction, true,
aggregateSequenceArgs);
Mutable<ILogicalExpression> aggregateExpRef = new MutableObject<ILogicalExpression>(aggregateExp);
exprs.add(aggregateExpRef);
return new AggregateOperator(aggregateVariables, exprs);
}
private Mutable<ILogicalOperator> getInputOperator(Mutable<ILogicalOperator> opRef) {
AbstractLogicalOperator op = (AbstractLogicalOperator) opRef.getValue();
switch (op.getOperatorTag()) {
case SUBPLAN:
SubplanOperator subplan = (SubplanOperator) op;
return getInputOperator(subplan.getNestedPlans().get(0).getRoots().get(0));
case NESTEDTUPLESOURCE:
NestedTupleSourceOperator nts = (NestedTupleSourceOperator) op;
return getInputOperator(nts.getDataSourceReference());
default:
return opRef;
}
}
private UnnestOperator getUnnestOperator(LogicalVariable inputVariable, LogicalVariable unnestVariable) {
VariableReferenceExpression inputVre = new VariableReferenceExpression(inputVariable);
List<Mutable<ILogicalExpression>> iterateArgs = new ArrayList<Mutable<ILogicalExpression>>();
iterateArgs.add(new MutableObject<ILogicalExpression>(inputVre));
ILogicalExpression unnestExp = new UnnestingFunctionCallExpression(BuiltinOperators.ITERATE, iterateArgs);
Mutable<ILogicalExpression> unnestExpRef = new MutableObject<ILogicalExpression>(unnestExp);
return new UnnestOperator(unnestVariable, unnestExpRef);
}
}