| /* |
| * Licensed to the Apache Software Foundation (ASF) under one |
| * or more contributor license agreements. See the NOTICE file |
| * distributed with this work for additional information |
| * regarding copyright ownership. The ASF licenses this file |
| * to you under the Apache License, Version 2.0 (the |
| * "License"); you may not use this file except in compliance |
| * with the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| package org.apache.flink.table.plan.nodes.dataset |
| |
| import org.apache.calcite.plan.{RelOptCluster, RelOptCost, RelOptPlanner, RelTraitSet} |
| import org.apache.calcite.rel.`type`.RelDataType |
| import org.apache.calcite.rel.core.AggregateCall |
| import org.apache.calcite.rel.metadata.RelMetadataQuery |
| import org.apache.calcite.rel.{RelNode, RelWriter, SingleRel} |
| import org.apache.flink.api.common.typeinfo.TypeInformation |
| import org.apache.flink.api.java.DataSet |
| import org.apache.flink.api.java.typeutils.RowTypeInfo |
| import org.apache.flink.table.api.{BatchQueryConfig, BatchTableEnvironment} |
| import org.apache.flink.table.calcite.FlinkTypeFactory |
| import org.apache.flink.table.codegen.AggregationCodeGenerator |
| import org.apache.flink.table.plan.nodes.CommonAggregate |
| import org.apache.flink.table.runtime.aggregate.AggregateUtil.CalcitePair |
| import org.apache.flink.table.runtime.aggregate.{AggregateUtil, DataSetAggFunction, DataSetFinalAggFunction, DataSetPreAggFunction} |
| import org.apache.flink.types.Row |
| |
| /** |
| * Flink RelNode which matches along with a LogicalAggregate. |
| */ |
| class DataSetAggregate( |
| cluster: RelOptCluster, |
| traitSet: RelTraitSet, |
| inputNode: RelNode, |
| namedAggregates: Seq[CalcitePair[AggregateCall, String]], |
| rowRelDataType: RelDataType, |
| inputType: RelDataType, |
| grouping: Array[Int]) |
| extends SingleRel(cluster, traitSet, inputNode) with CommonAggregate with DataSetRel { |
| |
| override def deriveRowType(): RelDataType = rowRelDataType |
| |
| override def copy(traitSet: RelTraitSet, inputs: java.util.List[RelNode]): RelNode = { |
| new DataSetAggregate( |
| cluster, |
| traitSet, |
| inputs.get(0), |
| namedAggregates, |
| getRowType, |
| inputType, |
| grouping) |
| } |
| |
| override def toString: String = { |
| s"Aggregate(${ |
| if (!grouping.isEmpty) { |
| s"groupBy: (${groupingToString(inputType, grouping)}), " |
| } else { |
| "" |
| } |
| }select: (${aggregationToString(inputType, grouping, getRowType, namedAggregates, Nil)}))" |
| } |
| |
| override def explainTerms(pw: RelWriter): RelWriter = { |
| super.explainTerms(pw) |
| .itemIf("groupBy", groupingToString(inputType, grouping), !grouping.isEmpty) |
| .item("select", aggregationToString(inputType, grouping, getRowType, namedAggregates, Nil)) |
| } |
| |
| override def computeSelfCost(planner: RelOptPlanner, metadata: RelMetadataQuery): RelOptCost = { |
| |
| val child = this.getInput |
| val rowCnt = metadata.getRowCount(child) |
| val rowSize = this.estimateRowSize(child.getRowType) |
| val aggCnt = this.namedAggregates.size |
| planner.getCostFactory.makeCost(rowCnt, rowCnt * aggCnt, rowCnt * rowSize) |
| } |
| |
| override def translateToPlan( |
| tableEnv: BatchTableEnvironment, |
| queryConfig: BatchQueryConfig): DataSet[Row] = { |
| |
| val input = inputNode.asInstanceOf[DataSetRel] |
| val inputDS = input.translateToPlan(tableEnv, queryConfig) |
| |
| val rowTypeInfo = FlinkTypeFactory.toInternalRowTypeInfo(getRowType).asInstanceOf[RowTypeInfo] |
| |
| val generator = new AggregationCodeGenerator( |
| tableEnv.getConfig, |
| false, |
| inputDS.getType, |
| None) |
| |
| val ( |
| preAgg: Option[DataSetPreAggFunction], |
| preAggType: Option[TypeInformation[Row]], |
| finalAgg: Either[DataSetAggFunction, DataSetFinalAggFunction] |
| ) = AggregateUtil.createDataSetAggregateFunctions( |
| generator, |
| namedAggregates, |
| input.getRowType, |
| inputDS.getType.asInstanceOf[RowTypeInfo].getFieldTypes, |
| rowRelDataType, |
| grouping, |
| tableEnv.getConfig) |
| |
| val aggString = aggregationToString(inputType, grouping, getRowType, namedAggregates, Nil) |
| |
| if (grouping.length > 0) { |
| // grouped aggregation |
| val aggOpName = s"groupBy: (${groupingToString(inputType, grouping)}), " + |
| s"select: ($aggString)" |
| |
| if (preAgg.isDefined) { |
| inputDS |
| // pre-aggregation |
| .groupBy(grouping: _*) |
| .combineGroup(preAgg.get) |
| .returns(preAggType.get) |
| .name(aggOpName) |
| // final aggregation |
| .groupBy(grouping.indices: _*) |
| .reduceGroup(finalAgg.right.get) |
| .returns(rowTypeInfo) |
| .name(aggOpName) |
| } else { |
| inputDS |
| .groupBy(grouping: _*) |
| .reduceGroup(finalAgg.left.get) |
| .returns(rowTypeInfo) |
| .name(aggOpName) |
| } |
| } |
| else { |
| // global aggregation |
| val aggOpName = s"select:($aggString)" |
| |
| if (preAgg.isDefined) { |
| inputDS |
| // pre-aggregation |
| .mapPartition(preAgg.get) |
| .returns(preAggType.get) |
| .name(aggOpName) |
| // final aggregation |
| .reduceGroup(finalAgg.right.get) |
| .returns(rowTypeInfo) |
| .name(aggOpName) |
| } else { |
| inputDS |
| .mapPartition(finalAgg.left.get).setParallelism(1) |
| .returns(rowTypeInfo) |
| .name(aggOpName) |
| } |
| } |
| } |
| } |