phoenix-core/src/main/java/org/apache/phoenix/compile/GroupByCompiler.java - phoenix - Git at Google

 /*
  * Licensed to the Apache Software Foundation (ASF) under one
  * or more contributor license agreements.  See the NOTICE file
  * distributed with this work for additional information
  * regarding copyright ownership.  The ASF licenses this file
  * to you under the Apache License, Version 2.0 (the
  * "License"); you may not use this file except in compliance
  * with the License.  You may obtain a copy of the License at
  *
  * http://www.apache.org/licenses/LICENSE-2.0
  *
  * Unless required by applicable law or agreed to in writing, software
  * distributed under the License is distributed on an "AS IS" BASIS,
  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */
 package org.apache.phoenix.compile;

 import java.sql.SQLException;
 import java.util.ArrayList;
 import java.util.Collections;
 import java.util.Comparator;
 import java.util.List;

 import net.jcip.annotations.Immutable;

 import org.apache.hadoop.hbase.util.Pair;
 import org.apache.phoenix.compile.OrderPreservingTracker.Info;
 import org.apache.phoenix.compile.OrderPreservingTracker.Ordering;
 import org.apache.phoenix.coprocessor.BaseScannerRegionObserver;
 import org.apache.phoenix.exception.SQLExceptionCode;
 import org.apache.phoenix.exception.SQLExceptionInfo;
 import org.apache.phoenix.expression.CoerceExpression;
 import org.apache.phoenix.expression.Expression;
 import org.apache.phoenix.parse.AliasedNode;
 import org.apache.phoenix.parse.DistinctCountParseNode;
 import org.apache.phoenix.parse.HintNode.Hint;
 import org.apache.phoenix.parse.ParseNode;
 import org.apache.phoenix.parse.SelectStatement;
 import org.apache.phoenix.schema.AmbiguousColumnException;
 import org.apache.phoenix.schema.ColumnNotFoundException;
 import org.apache.phoenix.schema.types.PDataType;
 import org.apache.phoenix.schema.types.PVarbinary;
 import org.apache.phoenix.util.IndexUtil;

 import com.google.common.collect.ImmutableList;
 import com.google.common.collect.Lists;

 /**
  *
  * Validates GROUP BY clause and builds a {@link GroupBy} instance to encapsulate the
  * group by expressions.
  *
  *
  * @since 0.1
  */
 public class GroupByCompiler {
     @Immutable
     public static class GroupBy {
         private final List<Expression> expressions;
         private final List<Expression> keyExpressions;
         private final boolean isOrderPreserving;
         private final int orderPreservingColumnCount;
         private final boolean isUngroupedAggregate;
         private final List<Info> orderPreservingTrackInfos;
         public static final GroupByCompiler.GroupBy EMPTY_GROUP_BY = new GroupBy(new GroupByBuilder()) {
             @Override
             public GroupBy compile(StatementContext context, QueryPlan innerQueryPlan, Expression whereExpression) throws SQLException {
                 return this;
             }

             @Override
             public void explain(List<String> planSteps, Integer limit) {
             }

             @Override
             public String getScanAttribName() {
                 return null;
             }
         };
         public static final GroupByCompiler.GroupBy UNGROUPED_GROUP_BY = new GroupBy(new GroupByBuilder().setIsOrderPreserving(true).setIsUngroupedAggregate(true)) {
             @Override
             public GroupBy compile(StatementContext context, QueryPlan innerQueryPlan, Expression whereExpression) throws SQLException {
                 return this;
             }

             @Override
             public void explain(List<String> planSteps, Integer limit) {
                 planSteps.add("    SERVER AGGREGATE INTO SINGLE ROW");
             }

             @Override
             public String getScanAttribName() {
                 return BaseScannerRegionObserver.UNGROUPED_AGG;
             }
         };

         private GroupBy(GroupByBuilder builder) {
             this.expressions = ImmutableList.copyOf(builder.expressions);
             this.keyExpressions = builder.expressions == builder.keyExpressions ?
                     this.expressions : builder.keyExpressions == null ? null :
                         ImmutableList.copyOf(builder.keyExpressions);
             this.isOrderPreserving = builder.isOrderPreserving;
             this.orderPreservingColumnCount = builder.orderPreservingColumnCount;
             this.isUngroupedAggregate = builder.isUngroupedAggregate;
             this.orderPreservingTrackInfos = builder.orderPreservingTrackInfos;
         }

         public List<Expression> getExpressions() {
             return expressions;
         }

         public List<Expression> getKeyExpressions() {
             return keyExpressions;
         }

         public String getScanAttribName() {
             if (isUngroupedAggregate) {
                 return BaseScannerRegionObserver.UNGROUPED_AGG;
             } else if (isOrderPreserving) {
                 return BaseScannerRegionObserver.KEY_ORDERED_GROUP_BY_EXPRESSIONS;
             } else {
                 return BaseScannerRegionObserver.UNORDERED_GROUP_BY_EXPRESSIONS;
             }
         }

         public boolean isEmpty() {
             return expressions.isEmpty();
         }

         public boolean isOrderPreserving() {
             return isOrderPreserving;
         }

         public boolean isUngroupedAggregate() {
             return isUngroupedAggregate;
         }

         public int getOrderPreservingColumnCount() {
             return orderPreservingColumnCount;
         }

         public List<Info> getOrderPreservingTrackInfos() {
             return orderPreservingTrackInfos;
         }

         public GroupBy compile(StatementContext context, QueryPlan innerQueryPlan, Expression whereExpression) throws SQLException {
             boolean isOrderPreserving = this.isOrderPreserving;
             int orderPreservingColumnCount = 0;
             if (isOrderPreserving) {
                 OrderPreservingTracker tracker = new OrderPreservingTracker(
                         context,
                         GroupBy.EMPTY_GROUP_BY,
                         Ordering.UNORDERED,
                         expressions.size(),
                         null,
                         innerQueryPlan,
                         whereExpression);
                 for (int i = 0; i < expressions.size(); i++) {
                     Expression expression = expressions.get(i);
                     tracker.track(expression);
                 }

                 // This is true if the GROUP BY is composed of only PK columns. We further check here that
                 // there are no "gaps" in the PK columns positions used (i.e. we start with the first PK
                 // column and use each subsequent one in PK order).
                 isOrderPreserving = tracker.isOrderPreserving();
                 orderPreservingColumnCount = tracker.getOrderPreservingColumnCount();
                 if(isOrderPreserving) {
                     //reorder the groupby expressions following pk columns
                     List<Info> orderPreservingTrackInfos = tracker.getOrderPreservingTrackInfos();
                     List<Expression> newExpressions = Info.extractExpressions(orderPreservingTrackInfos);
                     assert newExpressions.size() == expressions.size();
                     return new GroupBy.GroupByBuilder(this)
                                .setIsOrderPreserving(isOrderPreserving)
                                .setOrderPreservingColumnCount(orderPreservingColumnCount)
                                .setExpressions(newExpressions)
                                .setKeyExpressions(newExpressions)
                                .setOrderPreservingTrackInfos(orderPreservingTrackInfos)
                                .build();
                 }
             }

             if (isUngroupedAggregate) {
                 return new GroupBy.GroupByBuilder(this)
                            .setIsOrderPreserving(isOrderPreserving)
                            .setOrderPreservingColumnCount(orderPreservingColumnCount)
                            .build();
             }
             List<Expression> expressions = Lists.newArrayListWithExpectedSize(this.expressions.size());
             List<Expression> keyExpressions = expressions;
             List<Pair<Integer,Expression>> groupBys = Lists.newArrayListWithExpectedSize(this.expressions.size());
             for (int i = 0; i < this.expressions.size(); i++) {
                 Expression expression = this.expressions.get(i);
                 groupBys.add(new Pair<Integer,Expression>(i,expression));
             }
             /*
              * If we're not ordered along the PK axis, our coprocessor needs to collect all distinct groups within
              * a region, sort them, and hold on to them until the scan completes.
              * Put fixed length nullables at the end, so that we can represent null by the absence of the trailing
              * value in the group by key. If there is more than one, we'll need to convert the ones not at the end
              * into a Decimal so that we can use an empty byte array as our representation for null (which correctly
              * maintains the sort order). We convert the Decimal back to the appropriate type (Integer or Long) when
              * it's retrieved from the result set.
              *
              * More specifically, order into the following buckets:
              *   1) non nullable fixed width
              *   2) variable width
              *   3) nullable fixed width
              * Within each bucket, order based on the column position in the schema. Putting the fixed width values
              * in the beginning optimizes access to subsequent values.
              */
             Collections.sort(groupBys, new Comparator<Pair<Integer,Expression>>() {
                 @Override
                 public int compare(Pair<Integer,Expression> gb1, Pair<Integer,Expression> gb2) {
                     Expression e1 = gb1.getSecond();
                     Expression e2 = gb2.getSecond();
                     PDataType t1 = e1.getDataType();
                     PDataType t2 = e2.getDataType();
                     boolean isFixed1 = t1.isFixedWidth();
                     boolean isFixed2 = t2.isFixedWidth();
                     boolean isFixedNullable1 = e1.isNullable() &&isFixed1;
                     boolean isFixedNullable2 = e2.isNullable() && isFixed2;
                     boolean oae1 = onlyAtEndType(e1);
                     boolean oae2 = onlyAtEndType(e2);
                     if (oae1 == oae2) {
                         if (isFixedNullable1 == isFixedNullable2) {
                             if (isFixed1 == isFixed2) {
                                 // Not strictly necessary, but forces the order to match the schema
                                 // column order (with PK columns before value columns).
                                 //return o1.getColumnPosition() - o2.getColumnPosition();
                                 return gb1.getFirst() - gb2.getFirst();
                             } else if (isFixed1) {
                                 return -1;
                             } else {
                                 return 1;
                             }
                         } else if (isFixedNullable1) {
                             return 1;
                         } else {
                             return -1;
                         }
                     } else if (oae1) {
                         return 1;
                     } else {
                         return -1;
                     }
                 }
             });
             boolean foundOnlyAtEndType = false;
             for (Pair<Integer,Expression> groupBy : groupBys) {
                 Expression e = groupBy.getSecond();
                 if (onlyAtEndType(e)) {
                     if (foundOnlyAtEndType) {
                         throw new SQLExceptionInfo.Builder(SQLExceptionCode.UNSUPPORTED_GROUP_BY_EXPRESSIONS)
                         .setMessage(e.toString()).build().buildException();
                     }
                     foundOnlyAtEndType  = true;
                 }
                 expressions.add(e);
             }
             for (int i = expressions.size()-2; i >= 0; i--) {
                 Expression expression = expressions.get(i);
                 PDataType keyType = getGroupByDataType(expression);
                 if (keyType == expression.getDataType()) {
                     continue;
                 }
                 // Copy expressions only when keyExpressions will be different than expressions
                 if (keyExpressions == expressions) {
                     keyExpressions = new ArrayList<Expression>(expressions);
                 }
                 // Wrap expression in an expression that coerces the expression to the required type..
                 // This is done so that we have a way of expressing null as an empty key when more
                 // than one fixed and nullable types are used in a group by clause
                 keyExpressions.set(i, CoerceExpression.create(expression, keyType));
             }

             GroupBy groupBy = new GroupBy.GroupByBuilder().setIsOrderPreserving(isOrderPreserving).setExpressions(expressions).setKeyExpressions(keyExpressions).build();
             return groupBy;
         }

         public static class GroupByBuilder {
             private boolean isOrderPreserving;
             private int orderPreservingColumnCount;
             private List<Expression> expressions = Collections.emptyList();
             private List<Expression> keyExpressions = Collections.emptyList();
             private boolean isUngroupedAggregate;
             private List<Info> orderPreservingTrackInfos = Collections.emptyList();

             public GroupByBuilder() {
             }

             public GroupByBuilder(GroupBy groupBy) {
                 this.isOrderPreserving = groupBy.isOrderPreserving;
                 this.orderPreservingColumnCount = groupBy.orderPreservingColumnCount;
                 this.expressions = groupBy.expressions;
                 this.keyExpressions = groupBy.keyExpressions;
                 this.isUngroupedAggregate = groupBy.isUngroupedAggregate;
             }

             public GroupByBuilder setExpressions(List<Expression> expressions) {
                 this.expressions = expressions;
                 return this;
             }

             public GroupByBuilder setKeyExpressions(List<Expression> keyExpressions) {
                 this.keyExpressions = keyExpressions;
                 return this;
             }

             public GroupByBuilder setIsOrderPreserving(boolean isOrderPreserving) {
                 this.isOrderPreserving = isOrderPreserving;
                 return this;
             }

             public GroupByBuilder setIsUngroupedAggregate(boolean isUngroupedAggregate) {
                 this.isUngroupedAggregate = isUngroupedAggregate;
                 return this;
             }

             public GroupByBuilder setOrderPreservingColumnCount(int orderPreservingColumnCount) {
                 this.orderPreservingColumnCount = orderPreservingColumnCount;
                 return this;
             }

             public GroupByBuilder setOrderPreservingTrackInfos(List<Info> orderPreservingTrackInfos) {
                 this.orderPreservingTrackInfos = orderPreservingTrackInfos;
                 return this;
             }

             public GroupBy build() {
                 return new GroupBy(this);
             }
         }

         public void explain(List<String> planSteps, Integer limit) {
             if (isUngroupedAggregate) {
                 planSteps.add("    SERVER AGGREGATE INTO SINGLE ROW");
             } else if (isOrderPreserving) {
                 planSteps.add("    SERVER AGGREGATE INTO ORDERED DISTINCT ROWS BY " + getExpressions() + (limit == null ? "" : " LIMIT " + limit + " GROUP" + (limit.intValue() == 1 ? "" : "S")));
             } else {
                 planSteps.add("    SERVER AGGREGATE INTO DISTINCT ROWS BY " + getExpressions() + (limit == null ? "" : " LIMIT " + limit + " GROUP" + (limit.intValue() == 1 ? "" : "S")));
             }
         }
     }

     /**
      * Get list of columns in the GROUP BY clause.
      * @param context query context kept between compilation of different query clauses
      * @param statement SQL statement being compiled
      * @return the {@link GroupBy} instance encapsulating the group by clause
      * @throws ColumnNotFoundException if column name could not be resolved
      * @throws AmbiguousColumnException if an unaliased column name is ambiguous across multiple tables
      */
     public static GroupBy compile(StatementContext context, SelectStatement statement) throws SQLException {
         List<ParseNode> groupByNodes = statement.getGroupBy();
         /**
          * Distinct can use an aggregate plan if there's no group by.
          * Otherwise, we need to insert a step after the Merge that dedups.
          * Order by only allowed on columns in the select distinct
          */
         boolean isUngroupedAggregate = false;
         if (groupByNodes.isEmpty()) {
             if (statement.isAggregate()) {
                 // do not optimize if
                 // 1. we were asked not to optimize
                 // 2. there's any HAVING clause
                 // TODO: PHOENIX-2989 suggests some ways to optimize the latter case
                 if (statement.getHint().hasHint(Hint.RANGE_SCAN) ||
                         statement.getHaving() != null) {
                     return GroupBy.UNGROUPED_GROUP_BY;
                 }
                 groupByNodes = Lists.newArrayListWithExpectedSize(statement.getSelect().size());
                 for (AliasedNode aliasedNode : statement.getSelect()) {
                     if (aliasedNode.getNode() instanceof DistinctCountParseNode) {
                         // only add children of DistinctCount nodes
                         groupByNodes.addAll(aliasedNode.getNode().getChildren());
                     } else {
                         // if we found anything else, do not attempt any further optimization
                         return GroupBy.UNGROUPED_GROUP_BY;
                     }
                 }
                 isUngroupedAggregate = true;
             } else if (statement.isDistinct()) {
                 groupByNodes = Lists.newArrayListWithExpectedSize(statement.getSelect().size());
                 for (AliasedNode aliasedNode : statement.getSelect()) {
                     // for distinct at all select expression as group by conditions
                     groupByNodes.add(aliasedNode.getNode());
                 }
             } else {
                 return GroupBy.EMPTY_GROUP_BY;
             }
         }

        // Accumulate expressions in GROUP BY
         ExpressionCompiler compiler =
                 new ExpressionCompiler(context, GroupBy.EMPTY_GROUP_BY);
         List<Expression> expressions = Lists.newArrayListWithExpectedSize(groupByNodes.size());
         for (int i = 0; i < groupByNodes.size(); i++) {
             ParseNode node = groupByNodes.get(i);
             Expression expression = node.accept(compiler);
             if (!expression.isStateless()) {
                 if (compiler.isAggregate()) {
                     throw new SQLExceptionInfo.Builder(SQLExceptionCode.AGGREGATE_IN_GROUP_BY)
                         .setMessage(expression.toString()).build().buildException();
                 }
                 expressions.add(expression);
             }
             compiler.reset();
         }

         if (expressions.isEmpty()) {
             return GroupBy.EMPTY_GROUP_BY;
         }
         GroupBy groupBy = new GroupBy.GroupByBuilder()
                 .setIsOrderPreserving(OrderByCompiler.isTrackOrderByPreserving(statement))
                 .setExpressions(expressions).setKeyExpressions(expressions)
                 .setIsUngroupedAggregate(isUngroupedAggregate).build();
         return groupBy;
     }

     private static boolean onlyAtEndType(Expression expression) {
         // Due to the encoding schema of these types, they may only be
         // used once in a group by and are located at the end of the
         // group by row key.
         PDataType type = getGroupByDataType(expression);
         return type.isArrayType() || type == PVarbinary.INSTANCE;
     }

     private static PDataType getGroupByDataType(Expression expression) {
         return IndexUtil.getIndexColumnDataType(expression.isNullable(), expression.getDataType());
     }

     private GroupByCompiler() {
     }
 }
	/*
	* Licensed to the Apache Software Foundation (ASF) under one
	* or more contributor license agreements. See the NOTICE file
	* distributed with this work for additional information
	* regarding copyright ownership. The ASF licenses this file
	* to you under the Apache License, Version 2.0 (the
	* "License"); you may not use this file except in compliance
	* with the License. You may obtain a copy of the License at
	*
	* http://www.apache.org/licenses/LICENSE-2.0
	*
	* Unless required by applicable law or agreed to in writing, software
	* distributed under the License is distributed on an "AS IS" BASIS,
	* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	* See the License for the specific language governing permissions and
	* limitations under the License.
	*/
	package org.apache.phoenix.compile;

	import java.sql.SQLException;
	import java.util.ArrayList;
	import java.util.Collections;
	import java.util.Comparator;
	import java.util.List;

	import net.jcip.annotations.Immutable;

	import org.apache.hadoop.hbase.util.Pair;
	import org.apache.phoenix.compile.OrderPreservingTracker.Info;
	import org.apache.phoenix.compile.OrderPreservingTracker.Ordering;
	import org.apache.phoenix.coprocessor.BaseScannerRegionObserver;
	import org.apache.phoenix.exception.SQLExceptionCode;
	import org.apache.phoenix.exception.SQLExceptionInfo;
	import org.apache.phoenix.expression.CoerceExpression;
	import org.apache.phoenix.expression.Expression;
	import org.apache.phoenix.parse.AliasedNode;
	import org.apache.phoenix.parse.DistinctCountParseNode;
	import org.apache.phoenix.parse.HintNode.Hint;
	import org.apache.phoenix.parse.ParseNode;
	import org.apache.phoenix.parse.SelectStatement;
	import org.apache.phoenix.schema.AmbiguousColumnException;
	import org.apache.phoenix.schema.ColumnNotFoundException;
	import org.apache.phoenix.schema.types.PDataType;
	import org.apache.phoenix.schema.types.PVarbinary;
	import org.apache.phoenix.util.IndexUtil;

	import com.google.common.collect.ImmutableList;
	import com.google.common.collect.Lists;

	/**
	*
	* Validates GROUP BY clause and builds a {@link GroupBy} instance to encapsulate the
	* group by expressions.
	*
	*
	* @since 0.1
	*/
	public class GroupByCompiler {
	@Immutable
	public static class GroupBy {
	private final List<Expression> expressions;
	private final List<Expression> keyExpressions;
	private final boolean isOrderPreserving;
	private final int orderPreservingColumnCount;
	private final boolean isUngroupedAggregate;
	private final List<Info> orderPreservingTrackInfos;
	public static final GroupByCompiler.GroupBy EMPTY_GROUP_BY = new GroupBy(new GroupByBuilder()) {
	@Override
	public GroupBy compile(StatementContext context, QueryPlan innerQueryPlan, Expression whereExpression) throws SQLException {
	return this;
	}

	@Override
	public void explain(List<String> planSteps, Integer limit) {
	}

	@Override
	public String getScanAttribName() {
	return null;
	}
	};
	public static final GroupByCompiler.GroupBy UNGROUPED_GROUP_BY = new GroupBy(new GroupByBuilder().setIsOrderPreserving(true).setIsUngroupedAggregate(true)) {
	@Override
	public GroupBy compile(StatementContext context, QueryPlan innerQueryPlan, Expression whereExpression) throws SQLException {
	return this;
	}

	@Override
	public void explain(List<String> planSteps, Integer limit) {
	planSteps.add(" SERVER AGGREGATE INTO SINGLE ROW");
	}

	@Override
	public String getScanAttribName() {
	return BaseScannerRegionObserver.UNGROUPED_AGG;
	}
	};

	private GroupBy(GroupByBuilder builder) {
	this.expressions = ImmutableList.copyOf(builder.expressions);
	this.keyExpressions = builder.expressions == builder.keyExpressions ?
	this.expressions : builder.keyExpressions == null ? null :
	ImmutableList.copyOf(builder.keyExpressions);
	this.isOrderPreserving = builder.isOrderPreserving;
	this.orderPreservingColumnCount = builder.orderPreservingColumnCount;
	this.isUngroupedAggregate = builder.isUngroupedAggregate;
	this.orderPreservingTrackInfos = builder.orderPreservingTrackInfos;
	}

	public List<Expression> getExpressions() {
	return expressions;
	}

	public List<Expression> getKeyExpressions() {
	return keyExpressions;
	}

	public String getScanAttribName() {
	if (isUngroupedAggregate) {
	return BaseScannerRegionObserver.UNGROUPED_AGG;
	} else if (isOrderPreserving) {
	return BaseScannerRegionObserver.KEY_ORDERED_GROUP_BY_EXPRESSIONS;
	} else {
	return BaseScannerRegionObserver.UNORDERED_GROUP_BY_EXPRESSIONS;
	}
	}

	public boolean isEmpty() {
	return expressions.isEmpty();
	}

	public boolean isOrderPreserving() {
	return isOrderPreserving;
	}

	public boolean isUngroupedAggregate() {
	return isUngroupedAggregate;
	}

	public int getOrderPreservingColumnCount() {
	return orderPreservingColumnCount;
	}

	public List<Info> getOrderPreservingTrackInfos() {
	return orderPreservingTrackInfos;
	}

	public GroupBy compile(StatementContext context, QueryPlan innerQueryPlan, Expression whereExpression) throws SQLException {
	boolean isOrderPreserving = this.isOrderPreserving;
	int orderPreservingColumnCount = 0;
	if (isOrderPreserving) {
	OrderPreservingTracker tracker = new OrderPreservingTracker(
	context,
	GroupBy.EMPTY_GROUP_BY,
	Ordering.UNORDERED,
	expressions.size(),
	null,
	innerQueryPlan,
	whereExpression);
	for (int i = 0; i < expressions.size(); i++) {
	Expression expression = expressions.get(i);
	tracker.track(expression);
	}

	// This is true if the GROUP BY is composed of only PK columns. We further check here that
	// there are no "gaps" in the PK columns positions used (i.e. we start with the first PK
	// column and use each subsequent one in PK order).
	isOrderPreserving = tracker.isOrderPreserving();
	orderPreservingColumnCount = tracker.getOrderPreservingColumnCount();
	if(isOrderPreserving) {
	//reorder the groupby expressions following pk columns
	List<Info> orderPreservingTrackInfos = tracker.getOrderPreservingTrackInfos();
	List<Expression> newExpressions = Info.extractExpressions(orderPreservingTrackInfos);
	assert newExpressions.size() == expressions.size();
	return new GroupBy.GroupByBuilder(this)
	.setIsOrderPreserving(isOrderPreserving)
	.setOrderPreservingColumnCount(orderPreservingColumnCount)
	.setExpressions(newExpressions)
	.setKeyExpressions(newExpressions)
	.setOrderPreservingTrackInfos(orderPreservingTrackInfos)
	.build();
	}
	}

	if (isUngroupedAggregate) {
	return new GroupBy.GroupByBuilder(this)
	.setIsOrderPreserving(isOrderPreserving)
	.setOrderPreservingColumnCount(orderPreservingColumnCount)
	.build();
	}
	List<Expression> expressions = Lists.newArrayListWithExpectedSize(this.expressions.size());
	List<Expression> keyExpressions = expressions;
	List<Pair<Integer,Expression>> groupBys = Lists.newArrayListWithExpectedSize(this.expressions.size());
	for (int i = 0; i < this.expressions.size(); i++) {
	Expression expression = this.expressions.get(i);
	groupBys.add(new Pair<Integer,Expression>(i,expression));
	}
	/*
	* If we're not ordered along the PK axis, our coprocessor needs to collect all distinct groups within
	* a region, sort them, and hold on to them until the scan completes.
	* Put fixed length nullables at the end, so that we can represent null by the absence of the trailing
	* value in the group by key. If there is more than one, we'll need to convert the ones not at the end
	* into a Decimal so that we can use an empty byte array as our representation for null (which correctly
	* maintains the sort order). We convert the Decimal back to the appropriate type (Integer or Long) when
	* it's retrieved from the result set.
	*
	* More specifically, order into the following buckets:
	* 1) non nullable fixed width
	* 2) variable width
	* 3) nullable fixed width
	* Within each bucket, order based on the column position in the schema. Putting the fixed width values
	* in the beginning optimizes access to subsequent values.
	*/
	Collections.sort(groupBys, new Comparator<Pair<Integer,Expression>>() {
	@Override
	public int compare(Pair<Integer,Expression> gb1, Pair<Integer,Expression> gb2) {
	Expression e1 = gb1.getSecond();
	Expression e2 = gb2.getSecond();
	PDataType t1 = e1.getDataType();
	PDataType t2 = e2.getDataType();
	boolean isFixed1 = t1.isFixedWidth();
	boolean isFixed2 = t2.isFixedWidth();
	boolean isFixedNullable1 = e1.isNullable() &&isFixed1;
	boolean isFixedNullable2 = e2.isNullable() && isFixed2;
	boolean oae1 = onlyAtEndType(e1);
	boolean oae2 = onlyAtEndType(e2);
	if (oae1 == oae2) {
	if (isFixedNullable1 == isFixedNullable2) {
	if (isFixed1 == isFixed2) {
	// Not strictly necessary, but forces the order to match the schema
	// column order (with PK columns before value columns).
	//return o1.getColumnPosition() - o2.getColumnPosition();
	return gb1.getFirst() - gb2.getFirst();
	} else if (isFixed1) {
	return -1;
	} else {
	return 1;
	}
	} else if (isFixedNullable1) {
	return 1;
	} else {
	return -1;
	}
	} else if (oae1) {
	return 1;
	} else {
	return -1;
	}
	}
	});
	boolean foundOnlyAtEndType = false;
	for (Pair<Integer,Expression> groupBy : groupBys) {
	Expression e = groupBy.getSecond();
	if (onlyAtEndType(e)) {
	if (foundOnlyAtEndType) {
	throw new SQLExceptionInfo.Builder(SQLExceptionCode.UNSUPPORTED_GROUP_BY_EXPRESSIONS)
	.setMessage(e.toString()).build().buildException();
	}
	foundOnlyAtEndType = true;
	}
	expressions.add(e);
	}
	for (int i = expressions.size()-2; i >= 0; i--) {
	Expression expression = expressions.get(i);
	PDataType keyType = getGroupByDataType(expression);
	if (keyType == expression.getDataType()) {
	continue;
	}
	// Copy expressions only when keyExpressions will be different than expressions
	if (keyExpressions == expressions) {
	keyExpressions = new ArrayList<Expression>(expressions);
	}
	// Wrap expression in an expression that coerces the expression to the required type..
	// This is done so that we have a way of expressing null as an empty key when more
	// than one fixed and nullable types are used in a group by clause
	keyExpressions.set(i, CoerceExpression.create(expression, keyType));
	}

	GroupBy groupBy = new GroupBy.GroupByBuilder().setIsOrderPreserving(isOrderPreserving).setExpressions(expressions).setKeyExpressions(keyExpressions).build();
	return groupBy;
	}

	public static class GroupByBuilder {
	private boolean isOrderPreserving;
	private int orderPreservingColumnCount;
	private List<Expression> expressions = Collections.emptyList();
	private List<Expression> keyExpressions = Collections.emptyList();
	private boolean isUngroupedAggregate;
	private List<Info> orderPreservingTrackInfos = Collections.emptyList();

	public GroupByBuilder() {
	}

	public GroupByBuilder(GroupBy groupBy) {
	this.isOrderPreserving = groupBy.isOrderPreserving;
	this.orderPreservingColumnCount = groupBy.orderPreservingColumnCount;
	this.expressions = groupBy.expressions;
	this.keyExpressions = groupBy.keyExpressions;
	this.isUngroupedAggregate = groupBy.isUngroupedAggregate;
	}

	public GroupByBuilder setExpressions(List<Expression> expressions) {
	this.expressions = expressions;
	return this;
	}

	public GroupByBuilder setKeyExpressions(List<Expression> keyExpressions) {
	this.keyExpressions = keyExpressions;
	return this;
	}

	public GroupByBuilder setIsOrderPreserving(boolean isOrderPreserving) {
	this.isOrderPreserving = isOrderPreserving;
	return this;
	}

	public GroupByBuilder setIsUngroupedAggregate(boolean isUngroupedAggregate) {
	this.isUngroupedAggregate = isUngroupedAggregate;
	return this;
	}

	public GroupByBuilder setOrderPreservingColumnCount(int orderPreservingColumnCount) {
	this.orderPreservingColumnCount = orderPreservingColumnCount;
	return this;
	}

	public GroupByBuilder setOrderPreservingTrackInfos(List<Info> orderPreservingTrackInfos) {
	this.orderPreservingTrackInfos = orderPreservingTrackInfos;
	return this;
	}

	public GroupBy build() {
	return new GroupBy(this);
	}
	}

	public void explain(List<String> planSteps, Integer limit) {
	if (isUngroupedAggregate) {
	planSteps.add(" SERVER AGGREGATE INTO SINGLE ROW");
	} else if (isOrderPreserving) {
	planSteps.add(" SERVER AGGREGATE INTO ORDERED DISTINCT ROWS BY " + getExpressions() + (limit == null ? "" : " LIMIT " + limit + " GROUP" + (limit.intValue() == 1 ? "" : "S")));
	} else {
	planSteps.add(" SERVER AGGREGATE INTO DISTINCT ROWS BY " + getExpressions() + (limit == null ? "" : " LIMIT " + limit + " GROUP" + (limit.intValue() == 1 ? "" : "S")));
	}
	}
	}

	/**
	* Get list of columns in the GROUP BY clause.
	* @param context query context kept between compilation of different query clauses
	* @param statement SQL statement being compiled
	* @return the {@link GroupBy} instance encapsulating the group by clause
	* @throws ColumnNotFoundException if column name could not be resolved
	* @throws AmbiguousColumnException if an unaliased column name is ambiguous across multiple tables
	*/
	public static GroupBy compile(StatementContext context, SelectStatement statement) throws SQLException {
	List<ParseNode> groupByNodes = statement.getGroupBy();
	/**
	* Distinct can use an aggregate plan if there's no group by.
	* Otherwise, we need to insert a step after the Merge that dedups.
	* Order by only allowed on columns in the select distinct
	*/
	boolean isUngroupedAggregate = false;
	if (groupByNodes.isEmpty()) {
	if (statement.isAggregate()) {
	// do not optimize if
	// 1. we were asked not to optimize
	// 2. there's any HAVING clause
	// TODO: PHOENIX-2989 suggests some ways to optimize the latter case
	if (statement.getHint().hasHint(Hint.RANGE_SCAN) \|\|
	statement.getHaving() != null) {
	return GroupBy.UNGROUPED_GROUP_BY;
	}
	groupByNodes = Lists.newArrayListWithExpectedSize(statement.getSelect().size());
	for (AliasedNode aliasedNode : statement.getSelect()) {
	if (aliasedNode.getNode() instanceof DistinctCountParseNode) {
	// only add children of DistinctCount nodes
	groupByNodes.addAll(aliasedNode.getNode().getChildren());
	} else {
	// if we found anything else, do not attempt any further optimization
	return GroupBy.UNGROUPED_GROUP_BY;
	}
	}
	isUngroupedAggregate = true;
	} else if (statement.isDistinct()) {
	groupByNodes = Lists.newArrayListWithExpectedSize(statement.getSelect().size());
	for (AliasedNode aliasedNode : statement.getSelect()) {
	// for distinct at all select expression as group by conditions
	groupByNodes.add(aliasedNode.getNode());
	}
	} else {
	return GroupBy.EMPTY_GROUP_BY;
	}
	}

	// Accumulate expressions in GROUP BY
	ExpressionCompiler compiler =
	new ExpressionCompiler(context, GroupBy.EMPTY_GROUP_BY);
	List<Expression> expressions = Lists.newArrayListWithExpectedSize(groupByNodes.size());
	for (int i = 0; i < groupByNodes.size(); i++) {
	ParseNode node = groupByNodes.get(i);
	Expression expression = node.accept(compiler);
	if (!expression.isStateless()) {
	if (compiler.isAggregate()) {
	throw new SQLExceptionInfo.Builder(SQLExceptionCode.AGGREGATE_IN_GROUP_BY)
	.setMessage(expression.toString()).build().buildException();
	}
	expressions.add(expression);
	}
	compiler.reset();
	}

	if (expressions.isEmpty()) {
	return GroupBy.EMPTY_GROUP_BY;
	}
	GroupBy groupBy = new GroupBy.GroupByBuilder()
	.setIsOrderPreserving(OrderByCompiler.isTrackOrderByPreserving(statement))
	.setExpressions(expressions).setKeyExpressions(expressions)
	.setIsUngroupedAggregate(isUngroupedAggregate).build();
	return groupBy;
	}

	private static boolean onlyAtEndType(Expression expression) {
	// Due to the encoding schema of these types, they may only be
	// used once in a group by and are located at the end of the
	// group by row key.
	PDataType type = getGroupByDataType(expression);
	return type.isArrayType() \|\| type == PVarbinary.INSTANCE;
	}

	private static PDataType getGroupByDataType(Expression expression) {
	return IndexUtil.getIndexColumnDataType(expression.isNullable(), expression.getDataType());
	}

	private GroupByCompiler() {
	}
	}