| /* |
| * Licensed to the Apache Software Foundation (ASF) under one |
| * or more contributor license agreements. See the NOTICE file |
| * distributed with this work for additional information |
| * regarding copyright ownership. The ASF licenses this file |
| * to you under the Apache License, Version 2.0 (the |
| * "License"); you may not use this file except in compliance |
| * with the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, |
| * software distributed under the License is distributed on an |
| * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
| * KIND, either express or implied. See the License for the |
| * specific language governing permissions and limitations |
| * under the License. |
| */ |
| package org.apache.iotdb.db.utils; |
| |
| import org.apache.iotdb.common.rpc.thrift.TAggregationType; |
| import org.apache.iotdb.commons.exception.MetadataException; |
| import org.apache.iotdb.commons.path.PartialPath; |
| import org.apache.iotdb.db.queryengine.plan.statement.component.Ordering; |
| import org.apache.iotdb.db.utils.constant.SqlConstant; |
| import org.apache.iotdb.tsfile.file.metadata.enums.TSDataType; |
| import org.apache.iotdb.tsfile.file.metadata.enums.TSEncoding; |
| |
| import java.util.Arrays; |
| import java.util.Collections; |
| import java.util.EnumMap; |
| import java.util.HashSet; |
| import java.util.List; |
| import java.util.Map; |
| import java.util.Set; |
| |
| import static org.apache.iotdb.db.queryengine.execution.operator.AggregationUtil.addPartialSuffix; |
| |
| public class SchemaUtils { |
| |
| private SchemaUtils() {} |
| |
| private static final Map<TSDataType, Set<TSEncoding>> schemaChecker = |
| new EnumMap<>(TSDataType.class); |
| |
| static { |
| Set<TSEncoding> booleanSet = new HashSet<>(); |
| booleanSet.add(TSEncoding.PLAIN); |
| booleanSet.add(TSEncoding.RLE); |
| schemaChecker.put(TSDataType.BOOLEAN, booleanSet); |
| |
| Set<TSEncoding> intSet = new HashSet<>(); |
| intSet.add(TSEncoding.PLAIN); |
| intSet.add(TSEncoding.RLE); |
| intSet.add(TSEncoding.TS_2DIFF); |
| intSet.add(TSEncoding.GORILLA); |
| intSet.add(TSEncoding.ZIGZAG); |
| intSet.add(TSEncoding.CHIMP); |
| intSet.add(TSEncoding.SPRINTZ); |
| intSet.add(TSEncoding.RLBE); |
| |
| schemaChecker.put(TSDataType.INT32, intSet); |
| schemaChecker.put(TSDataType.INT64, intSet); |
| |
| Set<TSEncoding> floatSet = new HashSet<>(); |
| floatSet.add(TSEncoding.PLAIN); |
| floatSet.add(TSEncoding.RLE); |
| floatSet.add(TSEncoding.TS_2DIFF); |
| floatSet.add(TSEncoding.GORILLA_V1); |
| floatSet.add(TSEncoding.GORILLA); |
| floatSet.add(TSEncoding.CHIMP); |
| floatSet.add(TSEncoding.SPRINTZ); |
| floatSet.add(TSEncoding.RLBE); |
| |
| schemaChecker.put(TSDataType.FLOAT, floatSet); |
| schemaChecker.put(TSDataType.DOUBLE, floatSet); |
| |
| Set<TSEncoding> textSet = new HashSet<>(); |
| textSet.add(TSEncoding.PLAIN); |
| textSet.add(TSEncoding.DICTIONARY); |
| schemaChecker.put(TSDataType.TEXT, textSet); |
| } |
| |
| /** |
| * If the datatype of 'aggregation' depends on 'measurementDataType' (min_value, max_value), |
| * return 'measurementDataType' directly, or return a list whose elements are all the datatype of |
| * 'aggregation' and its length is the same as 'measurementDataType'. |
| * |
| * @param measurementDataType raw measurement type |
| * @param aggregation aggregation type |
| * @return measurementDataType directly, or return a list whose elements are all the datatype of |
| * aggregation and its length is the same as 'measurementDataType' |
| */ |
| public static List<TSDataType> getAggregatedDataTypes( |
| List<TSDataType> measurementDataType, String aggregation) { |
| TSDataType dataType = getBuiltinAggregationTypeByFuncName(aggregation); |
| if (dataType != null) { |
| return Collections.nCopies(measurementDataType.size(), dataType); |
| } |
| return measurementDataType; |
| } |
| |
| public static TSDataType getSeriesTypeByPath(PartialPath path, String aggregation) { |
| TSDataType dataType = getBuiltinAggregationTypeByFuncName(aggregation); |
| if (dataType != null) { |
| return dataType; |
| } else { |
| return path.getSeriesType(); |
| } |
| } |
| |
| /** |
| * @param aggregation aggregation function |
| * @return the data type of the aggregation or null if it aggregation is null |
| */ |
| public static TSDataType getBuiltinAggregationTypeByFuncName(String aggregation) { |
| if (aggregation == null) { |
| return null; |
| } |
| switch (aggregation.toLowerCase()) { |
| case SqlConstant.MIN_TIME: |
| case SqlConstant.MAX_TIME: |
| case SqlConstant.COUNT: |
| case SqlConstant.TIME_DURATION: |
| case SqlConstant.COUNT_TIME: |
| return TSDataType.INT64; |
| case SqlConstant.AVG: |
| case SqlConstant.SUM: |
| case SqlConstant.STDDEV: |
| case SqlConstant.STDDEV_POP: |
| case SqlConstant.STDDEV_SAMP: |
| case SqlConstant.VARIANCE: |
| case SqlConstant.VAR_POP: |
| case SqlConstant.VAR_SAMP: |
| return TSDataType.DOUBLE; |
| // Partial aggregation names |
| case SqlConstant.STDDEV + "_partial": |
| case SqlConstant.STDDEV_POP + "_partial": |
| case SqlConstant.STDDEV_SAMP + "_partial": |
| case SqlConstant.VARIANCE + "_partial": |
| case SqlConstant.VAR_POP + "_partial": |
| case SqlConstant.VAR_SAMP + "_partial": |
| case SqlConstant.MAX_BY + "_partial": |
| case SqlConstant.MIN_BY + "_partial": |
| return TSDataType.TEXT; |
| case SqlConstant.LAST_VALUE: |
| case SqlConstant.FIRST_VALUE: |
| case SqlConstant.MIN_VALUE: |
| case SqlConstant.MAX_VALUE: |
| case SqlConstant.MODE: |
| case SqlConstant.MAX_BY: |
| case SqlConstant.MIN_BY: |
| default: |
| return null; |
| } |
| } |
| |
| /** |
| * Return aggregation function name by given function type. If aggregation type is UDAF, you shall |
| * acquire its name in other ways. |
| * |
| * @param aggregationType aggregation type |
| * @return the name of the aggregation or null if its aggregation type is null |
| */ |
| public static String getBuiltinAggregationName(TAggregationType aggregationType) { |
| if (aggregationType == null) { |
| return null; |
| } |
| switch (aggregationType) { |
| case COUNT: |
| return SqlConstant.COUNT; |
| case AVG: |
| return SqlConstant.AVG; |
| case SUM: |
| return SqlConstant.SUM; |
| case FIRST_VALUE: |
| return SqlConstant.FIRST_VALUE; |
| case LAST_VALUE: |
| return SqlConstant.LAST_VALUE; |
| case MAX_TIME: |
| return SqlConstant.MAX_TIME; |
| case MIN_TIME: |
| return SqlConstant.MIN_TIME; |
| case MAX_VALUE: |
| return SqlConstant.MAX_VALUE; |
| case MIN_VALUE: |
| return SqlConstant.MIN_VALUE; |
| case EXTREME: |
| return SqlConstant.EXTREME; |
| case COUNT_IF: |
| return SqlConstant.COUNT_IF; |
| case TIME_DURATION: |
| return SqlConstant.TIME_DURATION; |
| case MODE: |
| return SqlConstant.MODE; |
| case COUNT_TIME: |
| return SqlConstant.COUNT_TIME; |
| case STDDEV: |
| return SqlConstant.STDDEV; |
| case STDDEV_POP: |
| return SqlConstant.STDDEV_POP; |
| case STDDEV_SAMP: |
| return SqlConstant.STDDEV_SAMP; |
| case VARIANCE: |
| return SqlConstant.VARIANCE; |
| case VAR_POP: |
| return SqlConstant.VAR_POP; |
| case VAR_SAMP: |
| return SqlConstant.VAR_SAMP; |
| default: |
| return null; |
| } |
| } |
| |
| /** |
| * judge whether the order of aggregation calculation is consistent with the order of traversing |
| * data |
| */ |
| public static boolean isConsistentWithScanOrder( |
| TAggregationType aggregationFunction, Ordering scanOrder) { |
| boolean ascending = scanOrder == Ordering.ASC; |
| switch (aggregationFunction) { |
| case MIN_TIME: |
| case FIRST_VALUE: |
| return ascending; |
| case MAX_TIME: |
| case LAST_VALUE: |
| return !ascending; |
| case SUM: |
| case MIN_VALUE: |
| case MAX_VALUE: |
| case EXTREME: |
| case COUNT: |
| case COUNT_TIME: |
| case AVG: |
| case TIME_DURATION: |
| case STDDEV: |
| case STDDEV_POP: |
| case STDDEV_SAMP: |
| case VARIANCE: |
| case VAR_POP: |
| case VAR_SAMP: |
| case MAX_BY: |
| case MIN_BY: |
| case UDAF: |
| return true; |
| default: |
| throw new IllegalArgumentException( |
| String.format("Invalid Aggregation function: %s", aggregationFunction)); |
| } |
| } |
| |
| public static void checkDataTypeWithEncoding(TSDataType dataType, TSEncoding encoding) |
| throws MetadataException { |
| if (!schemaChecker.get(dataType).contains(encoding)) { |
| throw new MetadataException( |
| String.format("encoding %s does not support %s", encoding, dataType), true); |
| } |
| } |
| |
| public static List<String> splitPartialBuiltinAggregation(TAggregationType aggregationType) { |
| switch (aggregationType) { |
| case FIRST_VALUE: |
| return Collections.singletonList(SqlConstant.MIN_TIME); |
| case LAST_VALUE: |
| return Collections.singletonList(SqlConstant.MAX_TIME); |
| case STDDEV: |
| return Collections.singletonList(addPartialSuffix(SqlConstant.STDDEV)); |
| case STDDEV_POP: |
| return Collections.singletonList(addPartialSuffix(SqlConstant.STDDEV_POP)); |
| case STDDEV_SAMP: |
| return Collections.singletonList(addPartialSuffix(SqlConstant.STDDEV_SAMP)); |
| case VARIANCE: |
| return Collections.singletonList(addPartialSuffix(SqlConstant.VARIANCE)); |
| case VAR_POP: |
| return Collections.singletonList(addPartialSuffix(SqlConstant.VAR_POP)); |
| case VAR_SAMP: |
| return Collections.singletonList(addPartialSuffix(SqlConstant.VAR_SAMP)); |
| case MAX_BY: |
| return Collections.singletonList(addPartialSuffix(SqlConstant.MAX_BY)); |
| case MIN_BY: |
| return Collections.singletonList(addPartialSuffix(SqlConstant.MIN_BY)); |
| case AVG: |
| return Arrays.asList(SqlConstant.COUNT, SqlConstant.SUM); |
| case TIME_DURATION: |
| return Arrays.asList(SqlConstant.MAX_TIME, SqlConstant.MIN_TIME); |
| case SUM: |
| case MIN_VALUE: |
| case MAX_VALUE: |
| case EXTREME: |
| case COUNT: |
| case COUNT_TIME: |
| case MIN_TIME: |
| case MAX_TIME: |
| case COUNT_IF: |
| case MODE: |
| return Collections.emptyList(); |
| default: |
| throw new IllegalArgumentException( |
| String.format("Invalid Aggregation function: %s", aggregationType)); |
| } |
| } |
| } |