| /* |
| * Licensed to the Apache Software Foundation (ASF) under one |
| * or more contributor license agreements. See the NOTICE file |
| * distributed with this work for additional information |
| * regarding copyright ownership. The ASF licenses this file |
| * to you under the Apache License, Version 2.0 (the |
| * "License"); you may not use this file except in compliance |
| * with the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, |
| * software distributed under the License is distributed on an |
| * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
| * KIND, either express or implied. See the License for the |
| * specific language governing permissions and limitations |
| * under the License. |
| */ |
| |
| package org.apache.asterix.lang.common.statement; |
| |
| import java.util.List; |
| import java.util.Locale; |
| |
| import org.apache.asterix.common.exceptions.CompilationException; |
| import org.apache.asterix.common.exceptions.ErrorCode; |
| import org.apache.asterix.common.metadata.DataverseName; |
| import org.apache.asterix.common.metadata.Namespace; |
| import org.apache.asterix.lang.common.base.AbstractStatement; |
| import org.apache.asterix.lang.common.base.Expression; |
| import org.apache.asterix.lang.common.expression.FieldBinding; |
| import org.apache.asterix.lang.common.expression.RecordConstructor; |
| import org.apache.asterix.lang.common.util.ExpressionUtils; |
| import org.apache.asterix.lang.common.util.LangRecordParseUtil; |
| import org.apache.asterix.lang.common.visitor.base.ILangVisitor; |
| import org.apache.asterix.object.base.AdmBigIntNode; |
| import org.apache.asterix.object.base.AdmDoubleNode; |
| import org.apache.asterix.object.base.AdmObjectNode; |
| import org.apache.asterix.object.base.AdmStringNode; |
| import org.apache.asterix.object.base.IAdmNode; |
| import org.apache.asterix.om.types.BuiltinType; |
| import org.apache.hyracks.algebricks.common.exceptions.AlgebricksException; |
| |
| public class AnalyzeStatement extends AbstractStatement { |
| |
| private static final String SAMPLE_FIELD_NAME = "sample"; |
| private static final String SAMPLE_LOW = "low"; |
| private static final String SAMPLE_MEDIUM = "medium"; |
| private static final String SAMPLE_HIGH = "high"; |
| private static final int SAMPLE_LOW_SIZE = 1063; |
| private static final int SAMPLE_MEDIUM_SIZE = SAMPLE_LOW_SIZE * 4; |
| private static final int SAMPLE_HIGH_SIZE = SAMPLE_MEDIUM_SIZE * 4; |
| private static final int SAMPLE_DEFAULT_SIZE = SAMPLE_LOW_SIZE; |
| |
| private static final String SAMPLE_SEED_FIELD_NAME = "sample-seed"; |
| |
| private final Namespace namespace; |
| private final String datasetName; |
| private final AdmObjectNode options; |
| |
| public AnalyzeStatement(Namespace namespace, String datasetName, RecordConstructor options) |
| throws CompilationException { |
| this.namespace = namespace; |
| this.datasetName = datasetName; |
| this.options = options == null ? null : validateOptions(options); |
| } |
| |
| private static AdmObjectNode validateOptions(RecordConstructor options) throws CompilationException { |
| final List<FieldBinding> fbList = options.getFbList(); |
| for (int i = 0; i < fbList.size(); i++) { |
| FieldBinding binding = fbList.get(i); |
| String key = LangRecordParseUtil.exprToStringLiteral(binding.getLeftExpr()).getStringValue(); |
| Expression value = binding.getRightExpr(); |
| switch (key) { |
| case SAMPLE_FIELD_NAME: |
| if (value.getKind() != Expression.Kind.LITERAL_EXPRESSION) { |
| throw new CompilationException(ErrorCode.INVALID_SAMPLE_SIZE); |
| } |
| break; |
| case SAMPLE_SEED_FIELD_NAME: |
| if (value.getKind() != Expression.Kind.LITERAL_EXPRESSION |
| && value.getKind() != Expression.Kind.UNARY_EXPRESSION) { |
| throw new CompilationException(ErrorCode.INVALID_SAMPLE_SEED); |
| } |
| break; |
| default: |
| throw new CompilationException(ErrorCode.INVALID_PARAM, key); |
| } |
| } |
| return (ExpressionUtils.toNode(options)); |
| } |
| |
| @Override |
| public Kind getKind() { |
| return Kind.ANALYZE; |
| } |
| |
| public Namespace getNamespace() { |
| return namespace; |
| } |
| |
| public DataverseName getDataverseName() { |
| return namespace == null ? null : namespace.getDataverseName(); |
| } |
| |
| public String getDatasetName() { |
| return datasetName; |
| } |
| |
| public int getSampleSize() throws CompilationException { |
| IAdmNode n = getOption(SAMPLE_FIELD_NAME); |
| if (n == null) { |
| return SAMPLE_DEFAULT_SIZE; |
| } |
| switch (n.getType()) { |
| case STRING: |
| String s = ((AdmStringNode) n).get(); |
| switch (s.toLowerCase(Locale.ROOT)) { |
| case SAMPLE_LOW: |
| return SAMPLE_LOW_SIZE; |
| case SAMPLE_MEDIUM: |
| return SAMPLE_MEDIUM_SIZE; |
| case SAMPLE_HIGH: |
| return SAMPLE_HIGH_SIZE; |
| default: |
| throw new CompilationException(ErrorCode.INVALID_SAMPLE_SIZE); |
| } |
| case BIGINT: |
| int v = (int) ((AdmBigIntNode) n).get(); |
| if (!isValidSampleSize(v)) { |
| throw new CompilationException(ErrorCode.OUT_OF_RANGE_SAMPLE_SIZE, SAMPLE_LOW_SIZE, |
| SAMPLE_HIGH_SIZE); |
| } |
| return v; |
| case DOUBLE: |
| v = (int) ((AdmDoubleNode) n).get(); |
| if (!isValidSampleSize(v)) { |
| throw new CompilationException(ErrorCode.OUT_OF_RANGE_SAMPLE_SIZE, SAMPLE_LOW_SIZE, |
| SAMPLE_HIGH_SIZE); |
| } |
| return v; |
| default: |
| throw new CompilationException(ErrorCode.WITH_FIELD_MUST_BE_OF_TYPE, SAMPLE_FIELD_NAME, |
| BuiltinType.ASTRING.getTypeName(), n.getType().toString()); |
| } |
| } |
| |
| public long getOrCreateSampleSeed() throws AlgebricksException { |
| IAdmNode n = getOption(SAMPLE_SEED_FIELD_NAME); |
| return n != null ? getSampleSeed(n) : createSampleSeed(); |
| } |
| |
| private long getSampleSeed(IAdmNode n) throws CompilationException { |
| switch (n.getType()) { |
| case BIGINT: |
| return ((AdmBigIntNode) n).get(); |
| case DOUBLE: |
| return (long) ((AdmDoubleNode) n).get(); |
| case STRING: |
| String s = ((AdmStringNode) n).get(); |
| try { |
| return Long.parseLong(s); |
| } catch (NumberFormatException e) { |
| throw new CompilationException(ErrorCode.INVALID_SAMPLE_SEED); |
| } |
| default: |
| throw new CompilationException(ErrorCode.WITH_FIELD_MUST_BE_OF_TYPE, SAMPLE_SEED_FIELD_NAME, |
| BuiltinType.AINT64.getTypeName(), n.getType().toString()); |
| } |
| } |
| |
| private long createSampleSeed() { |
| return System.nanoTime() + System.identityHashCode(this); |
| } |
| |
| private boolean isValidSampleSize(int v) { |
| return v >= SAMPLE_LOW_SIZE && v <= SAMPLE_HIGH_SIZE; |
| } |
| |
| private IAdmNode getOption(String optionName) { |
| return options != null ? options.get(optionName) : null; |
| } |
| |
| @Override |
| public <R, T> R accept(ILangVisitor<R, T> visitor, T arg) throws CompilationException { |
| return visitor.visit(this, arg); |
| } |
| |
| @Override |
| public byte getCategory() { |
| return Category.DDL; |
| } |
| } |