| /* |
| * Licensed to the Apache Software Foundation (ASF) under one |
| * or more contributor license agreements. See the NOTICE file |
| * distributed with this work for additional information |
| * regarding copyright ownership. The ASF licenses this file |
| * to you under the Apache License, Version 2.0 (the |
| * "License"); you may not use this file except in compliance |
| * with the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, |
| * software distributed under the License is distributed on an |
| * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
| * KIND, either express or implied. See the License for the |
| * specific language governing permissions and limitations |
| * under the License. |
| */ |
| |
| package org.apache.iotdb.db.queryengine.plan.planner.plan.node.process; |
| |
| import org.apache.iotdb.db.queryengine.common.header.ColumnHeaderConstant; |
| import org.apache.iotdb.db.queryengine.plan.expression.Expression; |
| import org.apache.iotdb.db.queryengine.plan.planner.plan.node.PlanNode; |
| import org.apache.iotdb.db.queryengine.plan.planner.plan.node.PlanNodeId; |
| import org.apache.iotdb.db.queryengine.plan.planner.plan.node.PlanNodeType; |
| import org.apache.iotdb.db.queryengine.plan.planner.plan.node.PlanVisitor; |
| import org.apache.iotdb.db.queryengine.plan.planner.plan.node.source.SeriesAggregationSourceNode; |
| import org.apache.iotdb.db.queryengine.plan.planner.plan.parameter.AggregationDescriptor; |
| import org.apache.iotdb.db.queryengine.plan.planner.plan.parameter.GroupByParameter; |
| import org.apache.iotdb.db.queryengine.plan.planner.plan.parameter.GroupByTimeParameter; |
| import org.apache.iotdb.db.queryengine.plan.statement.component.Ordering; |
| |
| import org.apache.tsfile.utils.ReadWriteIOUtils; |
| |
| import javax.annotation.Nullable; |
| |
| import java.io.DataOutputStream; |
| import java.io.IOException; |
| import java.nio.ByteBuffer; |
| import java.util.ArrayList; |
| import java.util.Collections; |
| import java.util.HashMap; |
| import java.util.List; |
| import java.util.Map; |
| import java.util.Objects; |
| import java.util.stream.Collectors; |
| |
| /** |
| * This node is used to aggregate required series from multiple sources. The source data will be |
| * input as a TsBlock, it may be raw data or partial aggregation result. This node will output the |
| * final series aggregated result represented by TsBlock. |
| */ |
| public class AggregationNode extends MultiChildProcessNode { |
| |
| // The list of aggregate functions, each AggregateDescriptor will be output as one or two column |
| // of result TsBlock |
| protected List<AggregationDescriptor> aggregationDescriptorList; |
| |
| // The parameter of `group by time`. |
| // Its value will be null if there is no `group by time` clause. |
| @Nullable protected GroupByTimeParameter groupByTimeParameter; |
| |
| // The parameter of `group by`. |
| // Its value will be null if there is no `group by` clause. |
| @Nullable protected GroupByParameter groupByParameter; |
| |
| // In some situation of `group by` clause, groupByExpression is required. |
| // It will be null if the clause doesn't refer to any expression. |
| protected Expression groupByExpression; |
| |
| protected Ordering scanOrder; |
| |
| protected boolean outputEndTime = false; |
| |
| public AggregationNode( |
| PlanNodeId id, |
| List<AggregationDescriptor> aggregationDescriptorList, |
| @Nullable GroupByTimeParameter groupByTimeParameter, |
| Ordering scanOrder) { |
| super(id, new ArrayList<>()); |
| this.aggregationDescriptorList = getDeduplicatedDescriptors(aggregationDescriptorList); |
| this.groupByTimeParameter = groupByTimeParameter; |
| this.scanOrder = scanOrder; |
| } |
| |
| public AggregationNode( |
| PlanNodeId id, |
| List<PlanNode> children, |
| List<AggregationDescriptor> aggregationDescriptorList, |
| @Nullable GroupByTimeParameter groupByTimeParameter, |
| Ordering scanOrder) { |
| super(id, children); |
| this.aggregationDescriptorList = getDeduplicatedDescriptors(aggregationDescriptorList); |
| this.groupByTimeParameter = groupByTimeParameter; |
| this.scanOrder = scanOrder; |
| } |
| |
| public AggregationNode( |
| PlanNodeId id, |
| List<AggregationDescriptor> aggregationDescriptorList, |
| @Nullable GroupByTimeParameter groupByTimeParameter, |
| @Nullable GroupByParameter groupByParameter, |
| Expression groupByExpression, |
| boolean outputEndTime, |
| Ordering scanOrder) { |
| super(id, new ArrayList<>()); |
| this.aggregationDescriptorList = getDeduplicatedDescriptors(aggregationDescriptorList); |
| this.groupByTimeParameter = groupByTimeParameter; |
| this.scanOrder = scanOrder; |
| this.groupByParameter = groupByParameter; |
| this.groupByExpression = groupByExpression; |
| this.outputEndTime = outputEndTime; |
| } |
| |
| public AggregationNode( |
| PlanNodeId id, |
| List<PlanNode> children, |
| List<AggregationDescriptor> aggregationDescriptorList, |
| @Nullable GroupByTimeParameter groupByTimeParameter, |
| @Nullable GroupByParameter groupByParameter, |
| Expression groupByExpression, |
| boolean outputEndTime, |
| Ordering scanOrder) { |
| super(id, children); |
| this.aggregationDescriptorList = getDeduplicatedDescriptors(aggregationDescriptorList); |
| this.scanOrder = scanOrder; |
| this.groupByParameter = groupByParameter; |
| this.groupByTimeParameter = groupByTimeParameter; |
| this.groupByExpression = groupByExpression; |
| this.outputEndTime = outputEndTime; |
| } |
| |
| public List<AggregationDescriptor> getAggregationDescriptorList() { |
| return aggregationDescriptorList; |
| } |
| |
| @Nullable |
| public GroupByTimeParameter getGroupByTimeParameter() { |
| return groupByTimeParameter; |
| } |
| |
| @Nullable |
| public GroupByParameter getGroupByParameter() { |
| return groupByParameter; |
| } |
| |
| public Ordering getScanOrder() { |
| return scanOrder; |
| } |
| |
| public boolean isOutputEndTime() { |
| return outputEndTime; |
| } |
| |
| public void setOutputEndTime(boolean outputEndTime) { |
| this.outputEndTime = outputEndTime; |
| } |
| |
| @Nullable |
| public Expression getGroupByExpression() { |
| return groupByExpression; |
| } |
| |
| @Override |
| public PlanNodeType getType() { |
| return PlanNodeType.AGGREGATE; |
| } |
| |
| @Override |
| public PlanNode clone() { |
| return new AggregationNode( |
| getPlanNodeId(), |
| getAggregationDescriptorList(), |
| getGroupByTimeParameter(), |
| getGroupByParameter(), |
| getGroupByExpression(), |
| outputEndTime, |
| getScanOrder()); |
| } |
| |
| @Override |
| public PlanNode createSubNode(int subNodeId, int startIndex, int endIndex) { |
| return new HorizontallyConcatNode( |
| new PlanNodeId(String.format("%s-%s", getPlanNodeId(), subNodeId)), |
| new ArrayList<>(children.subList(startIndex, endIndex))); |
| } |
| |
| @Override |
| public List<String> getOutputColumnNames() { |
| List<String> outputColumnNames = new ArrayList<>(); |
| if (outputEndTime) { |
| outputColumnNames.add(ColumnHeaderConstant.ENDTIME); |
| } |
| outputColumnNames.addAll( |
| aggregationDescriptorList.stream() |
| .map(AggregationDescriptor::getOutputColumnNames) |
| .flatMap(List::stream) |
| .collect(Collectors.toList())); |
| |
| return outputColumnNames; |
| } |
| |
| public static List<SeriesAggregationSourceNode> findAggregationSourceNode(PlanNode node) { |
| if (node == null) { |
| return new ArrayList<>(); |
| } |
| if (node instanceof SeriesAggregationSourceNode) { |
| return Collections.singletonList((SeriesAggregationSourceNode) node); |
| } |
| List<SeriesAggregationSourceNode> ret = new ArrayList<>(); |
| node.getChildren().forEach(child -> ret.addAll(findAggregationSourceNode(child))); |
| return ret; |
| } |
| |
| @Override |
| public <R, C> R accept(PlanVisitor<R, C> visitor, C context) { |
| return visitor.visitAggregation(this, context); |
| } |
| |
| @Override |
| protected void serializeAttributes(ByteBuffer byteBuffer) { |
| PlanNodeType.AGGREGATE.serialize(byteBuffer); |
| ReadWriteIOUtils.write(aggregationDescriptorList.size(), byteBuffer); |
| for (AggregationDescriptor aggregationDescriptor : aggregationDescriptorList) { |
| aggregationDescriptor.serialize(byteBuffer); |
| } |
| if (groupByTimeParameter == null) { |
| ReadWriteIOUtils.write((byte) 0, byteBuffer); |
| } else { |
| ReadWriteIOUtils.write((byte) 1, byteBuffer); |
| groupByTimeParameter.serialize(byteBuffer); |
| } |
| if (groupByParameter == null) { |
| ReadWriteIOUtils.write((byte) 0, byteBuffer); |
| } else { |
| ReadWriteIOUtils.write((byte) 1, byteBuffer); |
| groupByParameter.serialize(byteBuffer); |
| } |
| if (groupByExpression == null) { |
| ReadWriteIOUtils.write((byte) 0, byteBuffer); |
| } else { |
| ReadWriteIOUtils.write((byte) 1, byteBuffer); |
| Expression.serialize(groupByExpression, byteBuffer); |
| } |
| ReadWriteIOUtils.write(outputEndTime, byteBuffer); |
| ReadWriteIOUtils.write(scanOrder.ordinal(), byteBuffer); |
| } |
| |
| @Override |
| protected void serializeAttributes(DataOutputStream stream) throws IOException { |
| PlanNodeType.AGGREGATE.serialize(stream); |
| ReadWriteIOUtils.write(aggregationDescriptorList.size(), stream); |
| for (AggregationDescriptor aggregationDescriptor : aggregationDescriptorList) { |
| aggregationDescriptor.serialize(stream); |
| } |
| if (groupByTimeParameter == null) { |
| ReadWriteIOUtils.write((byte) 0, stream); |
| } else { |
| ReadWriteIOUtils.write((byte) 1, stream); |
| groupByTimeParameter.serialize(stream); |
| } |
| if (groupByParameter == null) { |
| ReadWriteIOUtils.write((byte) 0, stream); |
| } else { |
| ReadWriteIOUtils.write((byte) 1, stream); |
| groupByParameter.serialize(stream); |
| } |
| if (groupByExpression == null) { |
| ReadWriteIOUtils.write((byte) 0, stream); |
| } else { |
| ReadWriteIOUtils.write((byte) 1, stream); |
| Expression.serialize(groupByExpression, stream); |
| } |
| ReadWriteIOUtils.write(outputEndTime, stream); |
| ReadWriteIOUtils.write(scanOrder.ordinal(), stream); |
| } |
| |
| public static AggregationNode deserialize(ByteBuffer byteBuffer) { |
| int descriptorSize = ReadWriteIOUtils.readInt(byteBuffer); |
| List<AggregationDescriptor> aggregationDescriptorList = new ArrayList<>(); |
| while (descriptorSize > 0) { |
| aggregationDescriptorList.add(AggregationDescriptor.deserialize(byteBuffer)); |
| descriptorSize--; |
| } |
| byte isNull = ReadWriteIOUtils.readByte(byteBuffer); |
| GroupByTimeParameter groupByTimeParameter = null; |
| if (isNull == 1) { |
| groupByTimeParameter = GroupByTimeParameter.deserialize(byteBuffer); |
| } |
| isNull = ReadWriteIOUtils.readByte(byteBuffer); |
| GroupByParameter groupByParameter = null; |
| if (isNull == 1) { |
| groupByParameter = GroupByParameter.deserialize(byteBuffer); |
| } |
| isNull = ReadWriteIOUtils.readByte(byteBuffer); |
| Expression groupByExpression = null; |
| if (isNull == 1) { |
| groupByExpression = Expression.deserialize(byteBuffer); |
| } |
| boolean outputEndTime = ReadWriteIOUtils.readBool(byteBuffer); |
| Ordering scanOrder = Ordering.values()[ReadWriteIOUtils.readInt(byteBuffer)]; |
| PlanNodeId planNodeId = PlanNodeId.deserialize(byteBuffer); |
| return new AggregationNode( |
| planNodeId, |
| aggregationDescriptorList, |
| groupByTimeParameter, |
| groupByParameter, |
| groupByExpression, |
| outputEndTime, |
| scanOrder); |
| } |
| |
| @Override |
| public boolean equals(Object o) { |
| if (this == o) { |
| return true; |
| } |
| if (o == null || getClass() != o.getClass()) { |
| return false; |
| } |
| if (!super.equals(o)) { |
| return false; |
| } |
| AggregationNode that = (AggregationNode) o; |
| return Objects.equals(aggregationDescriptorList, that.aggregationDescriptorList) |
| && Objects.equals(groupByTimeParameter, that.groupByTimeParameter) |
| && Objects.equals(groupByParameter, that.groupByParameter) |
| && Objects.equals(groupByExpression, that.groupByExpression) |
| && Objects.equals(outputEndTime, that.outputEndTime) |
| && scanOrder == that.scanOrder; |
| } |
| |
| @Override |
| public int hashCode() { |
| return Objects.hash( |
| super.hashCode(), |
| aggregationDescriptorList, |
| groupByTimeParameter, |
| groupByParameter, |
| groupByExpression, |
| outputEndTime, |
| scanOrder); |
| } |
| |
| /** |
| * If aggregation function COUNT and AVG for one time series appears at the same time, and outputs |
| * intermediate result, the output columns will be like | COUNT | COUNT | SUM |. In this |
| * situation, one COUNT column is not needed. Therefore, when COUNT(or SUM) appears with AVG and |
| * outputs intermediate result(if they output final result, they will be all necessary), we need |
| * to REMOVE the COUNT aggregation, and only keep AVG function no matter their appearing order. |
| * |
| * <p>The related functions include AVG(COUNT AND SUM), FIRST_VALUE(FIRST_VALUE AND MIN_TIME), |
| * LAST_VALUE(LAST_VALUE AND MAX_TIME). |
| */ |
| public static List<AggregationDescriptor> getDeduplicatedDescriptors( |
| List<AggregationDescriptor> aggregationDescriptors) { |
| Map<String, Integer> columnToIndexMap = new HashMap<>(); |
| boolean[] removedIndexes = new boolean[aggregationDescriptors.size()]; |
| for (int i = 0; i < aggregationDescriptors.size(); i++) { |
| AggregationDescriptor descriptor = aggregationDescriptors.get(i); |
| if (descriptor.getStep().isOutputPartial()) { |
| List<String> outputColumnNames = descriptor.getOutputColumnNames(); |
| for (String outputColumn : outputColumnNames) { |
| // if encountering repeated column |
| if (columnToIndexMap.containsKey(outputColumn)) { |
| // if self is double outputs, then remove the former, else remove self |
| if (outputColumnNames.size() == 2) { |
| removedIndexes[columnToIndexMap.get(outputColumn)] = true; |
| } else { |
| removedIndexes[i] = true; |
| } |
| } else { |
| columnToIndexMap.put(outputColumn, i); |
| } |
| } |
| } |
| } |
| List<AggregationDescriptor> deduplicatedDescriptors = new ArrayList<>(); |
| for (int i = 0; i < aggregationDescriptors.size(); i++) { |
| if (!removedIndexes[i]) { |
| deduplicatedDescriptors.add(aggregationDescriptors.get(i)); |
| } |
| } |
| return deduplicatedDescriptors; |
| } |
| |
| public String toString() { |
| return String.format("AggregationNode-%s", getPlanNodeId()); |
| } |
| } |