blob: 533e1c7ab348dae4cf14705548b1ef4b3136c92a [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
package org.apache.iotdb.db.utils;
import org.apache.iotdb.common.rpc.thrift.TAggregationType;
import org.apache.iotdb.commons.exception.MetadataException;
import org.apache.iotdb.commons.path.PartialPath;
import org.apache.iotdb.db.queryengine.plan.statement.component.Ordering;
import org.apache.iotdb.db.utils.constant.SqlConstant;
import org.apache.iotdb.tsfile.file.metadata.enums.TSDataType;
import org.apache.iotdb.tsfile.file.metadata.enums.TSEncoding;
import java.util.Arrays;
import java.util.Collections;
import java.util.EnumMap;
import java.util.HashSet;
import java.util.List;
import java.util.Map;
import java.util.Set;
import static org.apache.iotdb.db.queryengine.execution.operator.AggregationUtil.addPartialSuffix;
public class SchemaUtils {
private SchemaUtils() {}
private static final Map<TSDataType, Set<TSEncoding>> schemaChecker =
new EnumMap<>(TSDataType.class);
static {
Set<TSEncoding> booleanSet = new HashSet<>();
booleanSet.add(TSEncoding.PLAIN);
booleanSet.add(TSEncoding.RLE);
schemaChecker.put(TSDataType.BOOLEAN, booleanSet);
Set<TSEncoding> intSet = new HashSet<>();
intSet.add(TSEncoding.PLAIN);
intSet.add(TSEncoding.RLE);
intSet.add(TSEncoding.TS_2DIFF);
intSet.add(TSEncoding.GORILLA);
intSet.add(TSEncoding.ZIGZAG);
intSet.add(TSEncoding.CHIMP);
intSet.add(TSEncoding.SPRINTZ);
intSet.add(TSEncoding.RLBE);
schemaChecker.put(TSDataType.INT32, intSet);
schemaChecker.put(TSDataType.INT64, intSet);
Set<TSEncoding> floatSet = new HashSet<>();
floatSet.add(TSEncoding.PLAIN);
floatSet.add(TSEncoding.RLE);
floatSet.add(TSEncoding.TS_2DIFF);
floatSet.add(TSEncoding.GORILLA_V1);
floatSet.add(TSEncoding.GORILLA);
floatSet.add(TSEncoding.CHIMP);
floatSet.add(TSEncoding.SPRINTZ);
floatSet.add(TSEncoding.RLBE);
schemaChecker.put(TSDataType.FLOAT, floatSet);
schemaChecker.put(TSDataType.DOUBLE, floatSet);
Set<TSEncoding> textSet = new HashSet<>();
textSet.add(TSEncoding.PLAIN);
textSet.add(TSEncoding.DICTIONARY);
schemaChecker.put(TSDataType.TEXT, textSet);
}
/**
* If the datatype of 'aggregation' depends on 'measurementDataType' (min_value, max_value),
* return 'measurementDataType' directly, or return a list whose elements are all the datatype of
* 'aggregation' and its length is the same as 'measurementDataType'.
*
* @param measurementDataType raw measurement type
* @param aggregation aggregation type
* @return measurementDataType directly, or return a list whose elements are all the datatype of
* aggregation and its length is the same as 'measurementDataType'
*/
public static List<TSDataType> getAggregatedDataTypes(
List<TSDataType> measurementDataType, String aggregation) {
TSDataType dataType = getBuiltinAggregationTypeByFuncName(aggregation);
if (dataType != null) {
return Collections.nCopies(measurementDataType.size(), dataType);
}
return measurementDataType;
}
public static TSDataType getSeriesTypeByPath(PartialPath path, String aggregation) {
TSDataType dataType = getBuiltinAggregationTypeByFuncName(aggregation);
if (dataType != null) {
return dataType;
} else {
return path.getSeriesType();
}
}
/**
* @param aggregation aggregation function
* @return the data type of the aggregation or null if it aggregation is null
*/
public static TSDataType getBuiltinAggregationTypeByFuncName(String aggregation) {
if (aggregation == null) {
return null;
}
switch (aggregation.toLowerCase()) {
case SqlConstant.MIN_TIME:
case SqlConstant.MAX_TIME:
case SqlConstant.COUNT:
case SqlConstant.TIME_DURATION:
case SqlConstant.COUNT_TIME:
return TSDataType.INT64;
case SqlConstant.AVG:
case SqlConstant.SUM:
case SqlConstant.STDDEV:
case SqlConstant.STDDEV_POP:
case SqlConstant.STDDEV_SAMP:
case SqlConstant.VARIANCE:
case SqlConstant.VAR_POP:
case SqlConstant.VAR_SAMP:
return TSDataType.DOUBLE;
// Partial aggregation names
case SqlConstant.STDDEV + "_partial":
case SqlConstant.STDDEV_POP + "_partial":
case SqlConstant.STDDEV_SAMP + "_partial":
case SqlConstant.VARIANCE + "_partial":
case SqlConstant.VAR_POP + "_partial":
case SqlConstant.VAR_SAMP + "_partial":
case SqlConstant.MAX_BY + "_partial":
case SqlConstant.MIN_BY + "_partial":
return TSDataType.TEXT;
case SqlConstant.LAST_VALUE:
case SqlConstant.FIRST_VALUE:
case SqlConstant.MIN_VALUE:
case SqlConstant.MAX_VALUE:
case SqlConstant.MODE:
case SqlConstant.MAX_BY:
case SqlConstant.MIN_BY:
default:
return null;
}
}
/**
* Return aggregation function name by given function type. If aggregation type is UDAF, you shall
* acquire its name in other ways.
*
* @param aggregationType aggregation type
* @return the name of the aggregation or null if its aggregation type is null
*/
public static String getBuiltinAggregationName(TAggregationType aggregationType) {
if (aggregationType == null) {
return null;
}
switch (aggregationType) {
case COUNT:
return SqlConstant.COUNT;
case AVG:
return SqlConstant.AVG;
case SUM:
return SqlConstant.SUM;
case FIRST_VALUE:
return SqlConstant.FIRST_VALUE;
case LAST_VALUE:
return SqlConstant.LAST_VALUE;
case MAX_TIME:
return SqlConstant.MAX_TIME;
case MIN_TIME:
return SqlConstant.MIN_TIME;
case MAX_VALUE:
return SqlConstant.MAX_VALUE;
case MIN_VALUE:
return SqlConstant.MIN_VALUE;
case EXTREME:
return SqlConstant.EXTREME;
case COUNT_IF:
return SqlConstant.COUNT_IF;
case TIME_DURATION:
return SqlConstant.TIME_DURATION;
case MODE:
return SqlConstant.MODE;
case COUNT_TIME:
return SqlConstant.COUNT_TIME;
case STDDEV:
return SqlConstant.STDDEV;
case STDDEV_POP:
return SqlConstant.STDDEV_POP;
case STDDEV_SAMP:
return SqlConstant.STDDEV_SAMP;
case VARIANCE:
return SqlConstant.VARIANCE;
case VAR_POP:
return SqlConstant.VAR_POP;
case VAR_SAMP:
return SqlConstant.VAR_SAMP;
default:
return null;
}
}
/**
* judge whether the order of aggregation calculation is consistent with the order of traversing
* data
*/
public static boolean isConsistentWithScanOrder(
TAggregationType aggregationFunction, Ordering scanOrder) {
boolean ascending = scanOrder == Ordering.ASC;
switch (aggregationFunction) {
case MIN_TIME:
case FIRST_VALUE:
return ascending;
case MAX_TIME:
case LAST_VALUE:
return !ascending;
case SUM:
case MIN_VALUE:
case MAX_VALUE:
case EXTREME:
case COUNT:
case COUNT_TIME:
case AVG:
case TIME_DURATION:
case STDDEV:
case STDDEV_POP:
case STDDEV_SAMP:
case VARIANCE:
case VAR_POP:
case VAR_SAMP:
case MAX_BY:
case MIN_BY:
case UDAF:
return true;
default:
throw new IllegalArgumentException(
String.format("Invalid Aggregation function: %s", aggregationFunction));
}
}
public static void checkDataTypeWithEncoding(TSDataType dataType, TSEncoding encoding)
throws MetadataException {
if (!schemaChecker.get(dataType).contains(encoding)) {
throw new MetadataException(
String.format("encoding %s does not support %s", encoding, dataType), true);
}
}
public static List<String> splitPartialBuiltinAggregation(TAggregationType aggregationType) {
switch (aggregationType) {
case FIRST_VALUE:
return Collections.singletonList(SqlConstant.MIN_TIME);
case LAST_VALUE:
return Collections.singletonList(SqlConstant.MAX_TIME);
case STDDEV:
return Collections.singletonList(addPartialSuffix(SqlConstant.STDDEV));
case STDDEV_POP:
return Collections.singletonList(addPartialSuffix(SqlConstant.STDDEV_POP));
case STDDEV_SAMP:
return Collections.singletonList(addPartialSuffix(SqlConstant.STDDEV_SAMP));
case VARIANCE:
return Collections.singletonList(addPartialSuffix(SqlConstant.VARIANCE));
case VAR_POP:
return Collections.singletonList(addPartialSuffix(SqlConstant.VAR_POP));
case VAR_SAMP:
return Collections.singletonList(addPartialSuffix(SqlConstant.VAR_SAMP));
case MAX_BY:
return Collections.singletonList(addPartialSuffix(SqlConstant.MAX_BY));
case MIN_BY:
return Collections.singletonList(addPartialSuffix(SqlConstant.MIN_BY));
case AVG:
return Arrays.asList(SqlConstant.COUNT, SqlConstant.SUM);
case TIME_DURATION:
return Arrays.asList(SqlConstant.MAX_TIME, SqlConstant.MIN_TIME);
case SUM:
case MIN_VALUE:
case MAX_VALUE:
case EXTREME:
case COUNT:
case COUNT_TIME:
case MIN_TIME:
case MAX_TIME:
case COUNT_IF:
case MODE:
return Collections.emptyList();
default:
throw new IllegalArgumentException(
String.format("Invalid Aggregation function: %s", aggregationType));
}
}
}